data-science-document-ai 1.59.0__tar.gz → 1.60.1__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/PKG-INFO +1 -1
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/pyproject.toml +1 -1
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/bookingConfirmation/evergreen/placeholders.json +4 -4
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/bookingConfirmation/evergreen/prompt.txt +6 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/bookingConfirmation/hapag-lloyd/placeholders.json +5 -5
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/bookingConfirmation/hapag-lloyd/prompt.txt +2 -2
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/bookingConfirmation/maersk/placeholders.json +7 -7
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/bookingConfirmation/maersk/prompt.txt +4 -3
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/bookingConfirmation/msc/placeholders.json +6 -6
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/bookingConfirmation/msc/prompt.txt +2 -2
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/bookingConfirmation/oocl/placeholders.json +8 -8
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/bookingConfirmation/other/placeholders.json +10 -10
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/bookingConfirmation/other/prompt.txt +3 -1
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/bookingConfirmation/yangming/placeholders.json +8 -8
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/customsInvoice/other/placeholders.json +1 -1
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/customsInvoice/other/prompt.txt +6 -2
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/partnerInvoice/other/placeholders.json +1 -1
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/partnerInvoice/other/prompt.txt +6 -2
- data_science_document_ai-1.60.1/src/prompts/library/preprocessing/carrier/prompt.txt +5 -0
- data_science_document_ai-1.59.0/src/prompts/library/preprocessing/carrier/prompt.txt +0 -4
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/constants.py +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/constants_sandbox.py +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/docai.py +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/docai_processor_config.yaml +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/excel_processing.py +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/io.py +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/llm.py +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/log_setup.py +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/pdf_processing.py +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/postprocessing/common.py +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/postprocessing/postprocess_booking_confirmation.py +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/postprocessing/postprocess_commercial_invoice.py +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/postprocessing/postprocess_partner_invoice.py +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/arrivalNotice/other/placeholders.json +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/arrivalNotice/other/prompt.txt +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/bookingConfirmation/oocl/prompt.txt +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/bookingConfirmation/yangming/prompt.txt +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/bundeskasse/other/placeholders.json +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/bundeskasse/other/prompt.txt +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/commercialInvoice/other/placeholders.json +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/commercialInvoice/other/prompt.txt +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/customsAssessment/other/placeholders.json +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/customsAssessment/other/prompt.txt +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/deliveryOrder/other/placeholders.json +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/deliveryOrder/other/prompt.txt +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/draftMbl/other/placeholders.json +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/draftMbl/other/prompt.txt +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/finalMbL/other/placeholders.json +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/finalMbL/other/prompt.txt +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/packingList/other/placeholders.json +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/packingList/other/prompt.txt +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/postprocessing/port_code/placeholders.json +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/postprocessing/port_code/prompt_port_code.txt +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/preprocessing/carrier/placeholders.json +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/shippingInstruction/other/placeholders.json +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/library/shippingInstruction/other/prompt.txt +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/prompt_library.py +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/setup.py +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/tms.py +0 -0
- {data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/utils.py +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
[tool.poetry]
|
|
2
2
|
name = "data-science-document-ai"
|
|
3
|
-
version = "1.
|
|
3
|
+
version = "1.60.1"
|
|
4
4
|
description = "\"Document AI repo for data science\""
|
|
5
5
|
authors = ["Naomi Nguyen <naomi.nguyen@forto.com>", "Kumar Rajendrababu <kumar.rajendrababu@forto.com>", "Igor Tonko <igor.tonko@forto.com>", "Osman Demirel <osman.demirel@forto.com>"]
|
|
6
6
|
packages = [
|
|
@@ -9,7 +9,7 @@
|
|
|
9
9
|
"contractNumber": {
|
|
10
10
|
"type": "STRING",
|
|
11
11
|
"nullable": true,
|
|
12
|
-
"description": "It's a contract number between the carrier and Forto Logistics SE & Co KG."
|
|
12
|
+
"description": "It's a contract number between the carrier and Forto Logistics SE & Co KG. Shipment Id 'S' followed by 6, 7, or 8 digits e.g. S9486358 is not a contract number."
|
|
13
13
|
},
|
|
14
14
|
"pickUpTerminalCode": {
|
|
15
15
|
"type": "STRING",
|
|
@@ -21,7 +21,7 @@
|
|
|
21
21
|
"nullable": true,
|
|
22
22
|
"description": "The specific terminal where cargo is gated in especially Export terminal delivery address. E.g., FULL RETURN TO or Export terminal name."
|
|
23
23
|
},
|
|
24
|
-
"
|
|
24
|
+
"proformaDate": {
|
|
25
25
|
"type": "STRING",
|
|
26
26
|
"nullable": true,
|
|
27
27
|
"description": "The date considered to apply the rates and charges specified in the booking confirmation"
|
|
@@ -34,7 +34,7 @@
|
|
|
34
34
|
"gateInReference": {
|
|
35
35
|
"type": "STRING",
|
|
36
36
|
"nullable": true,
|
|
37
|
-
"description": "A reference code for cargo entering the terminal to drop the loaded cargo for Export. Sometimes it can be '
|
|
37
|
+
"description": "A reference code for cargo entering the terminal to drop the loaded cargo for Export. Sometimes it can be 'Booking Number'."
|
|
38
38
|
},
|
|
39
39
|
"mblNumber": {
|
|
40
40
|
"type": "STRING",
|
|
@@ -139,7 +139,7 @@
|
|
|
139
139
|
"carrierName": {
|
|
140
140
|
"type": "STRING",
|
|
141
141
|
"nullable": true,
|
|
142
|
-
"description": "The name of the carrier who issued the document e,g, Evergreen Line."
|
|
142
|
+
"description": "The name of the carrier who issued the document. Extract full name. e,g, Evergreen Line."
|
|
143
143
|
}
|
|
144
144
|
},
|
|
145
145
|
"required": ["bookingNumber", "transportLegs", "containers", "cyCutOff", "vgmCutOff", "siCutOff"]
|
|
@@ -17,6 +17,12 @@ For Import Shipment: The loaded container / cargo arrives at a port of discharge
|
|
|
17
17
|
- Populate fields as defined in the response schema.
|
|
18
18
|
- Use the data field description to understand the context of the data.
|
|
19
19
|
|
|
20
|
+
- Containers: Need to extract Depot details per Container Type. Multiple Containers entries may exist, capture all instances under "Containers".
|
|
21
|
+
- containerType: The type of container (e.g., 20FT, 40FT, 20ft, 40ft, 40HC, 20DC, etc...).
|
|
22
|
+
- pickupDepotCode: The code of the depot where the empty container is picked up.It is identified as Empty Pick Up AT Depot or Export Empty Pick Up Depot(s).
|
|
23
|
+
- dropOffDepotCode: The code of the depot where the empty container is dropped off. It is identified as Import Empty Drop Off Depot(s). Full Return To is not the drop off depot.
|
|
24
|
+
|
|
25
|
+
|
|
20
26
|
- transportLegs: Multiple Transport Legs entries may exist, capture all instances under "transportLegs". Make sure the order of the legs are important.
|
|
21
27
|
- eta: The estimated time of arrival for a specific leg.
|
|
22
28
|
- etd: The estimated time of departure for a specific leg. ETD DATE above the PORT OF DISCHARGING information.
|
|
@@ -9,7 +9,7 @@
|
|
|
9
9
|
"contractNumber": {
|
|
10
10
|
"type": "STRING",
|
|
11
11
|
"nullable": true,
|
|
12
|
-
"description": "It's a contract number between the carrier and Forto Logistics SE & Co KG."
|
|
12
|
+
"description": "It's a contract number between the carrier and Forto Logistics SE & Co KG. It can be mentioned as Contract No., Contract Reference, or Quotation No. Shipment Id 'S' followed by 6, 7, or 8 digits e.g. S9486358 is not a contract number."
|
|
13
13
|
},
|
|
14
14
|
"pickUpTerminalCode": {
|
|
15
15
|
"type": "STRING",
|
|
@@ -21,10 +21,10 @@
|
|
|
21
21
|
"nullable": true,
|
|
22
22
|
"description": "The specific terminal where cargo is gated in especially Export terminal delivery address. E.g., Export terminal delivery address, Export terminal location, or Export terminal name."
|
|
23
23
|
},
|
|
24
|
-
"
|
|
24
|
+
"proformaDate": {
|
|
25
25
|
"type": "STRING",
|
|
26
26
|
"nullable": true,
|
|
27
|
-
"description": "The date considered to apply the rates and charges specified in the booking confirmation"
|
|
27
|
+
"description": "The date considered to apply the rates and charges specified in the booking confirmation. Issue date is not a Proforma Date."
|
|
28
28
|
},
|
|
29
29
|
"cyCutOff": {
|
|
30
30
|
"type": "STRING",
|
|
@@ -34,7 +34,7 @@
|
|
|
34
34
|
"gateInReference": {
|
|
35
35
|
"type": "STRING",
|
|
36
36
|
"nullable": true,
|
|
37
|
-
"description": "A reference code for cargo entering the terminal to drop the loaded cargo for Export. Sometimes it can be '
|
|
37
|
+
"description": "A reference code for cargo entering the terminal to drop the loaded cargo for Export. Sometimes it can be 'Booking Number'."
|
|
38
38
|
},
|
|
39
39
|
"mblNumber": {
|
|
40
40
|
"type": "STRING",
|
|
@@ -139,7 +139,7 @@
|
|
|
139
139
|
"carrierName": {
|
|
140
140
|
"type": "STRING",
|
|
141
141
|
"nullable": true,
|
|
142
|
-
"description": "The name of the carrier who issued the document e,g, Hapag-Lloyd."
|
|
142
|
+
"description": "The name of the carrier who issued the document. Extract full name e,g, Hapag-Lloyd (Vietnam) Ltd."
|
|
143
143
|
}
|
|
144
144
|
},
|
|
145
145
|
"required": ["bookingNumber", "transportLegs", "containers", "cyCutOff", "vgmCutOff", "siCutOff"]
|
|
@@ -28,10 +28,10 @@ For Import Shipment: The loaded container / cargo arrives at a port of discharge
|
|
|
28
28
|
- vgmCutOff: The deadline for submitting the Verified Gross Mass of the cargo. It can be referred to as VGM cut-off, VGM Submission Deadline, Verified Gross Mass deadline
|
|
29
29
|
|
|
30
30
|
- carrierName and carrierAddress:
|
|
31
|
-
- Extract the name and address of the carrier who is the main parent company in the document.
|
|
31
|
+
- Extract the full name and address of the carrier who is the main parent company in the document.
|
|
32
32
|
- It can be found in the top section of the document, often near the logo or header.
|
|
33
33
|
- Example:
|
|
34
|
-
- "Hapag-Lloyd" for carrierName
|
|
34
|
+
- "Hapag-Lloyd" or "Hapag-Lloyd (China) LTD" for carrierName
|
|
35
35
|
- Hamburg, Germany, Poland, Italy, Vietnam, China etc... for carrierAddress
|
|
36
36
|
|
|
37
37
|
- transportLegs: Multiple Transport Legs entries may exist, capture all instances under "transportLegs". Make sure the order of the legs are important.
|
|
@@ -9,7 +9,7 @@
|
|
|
9
9
|
"contractNumber": {
|
|
10
10
|
"type": "STRING",
|
|
11
11
|
"nullable": true,
|
|
12
|
-
"description": "It's a contract number between the carrier and Forto Logistics SE & Co KG."
|
|
12
|
+
"description": "It's a contract number between the carrier and Forto Logistics SE & Co KG. Shipment Id 'S' followed by 6, 7, or 8 digits e.g. S9486358 is not a contract number."
|
|
13
13
|
},
|
|
14
14
|
"pickUpTerminalCode": {
|
|
15
15
|
"type": "STRING",
|
|
@@ -21,10 +21,10 @@
|
|
|
21
21
|
"nullable": true,
|
|
22
22
|
"description": "The specific terminal where cargo is gated in especially Export terminal delivery address. E.g., Export terminal delivery address, Export terminal location, or Return Equip Delivery Terminal."
|
|
23
23
|
},
|
|
24
|
-
"
|
|
24
|
+
"proformaDate": {
|
|
25
25
|
"type": "STRING",
|
|
26
26
|
"nullable": true,
|
|
27
|
-
"description": "The date considered to apply the rates and charges specified in the booking confirmation. It is mentioned as Price Calculation Date or
|
|
27
|
+
"description": "The date considered to apply the rates and charges specified in the booking confirmation. It is mentioned as Price Calculation Date or proforma Date. Release Date, ETD, and ETA is not considered as proforma Date."
|
|
28
28
|
},
|
|
29
29
|
"cyCutOff": {
|
|
30
30
|
"type": "STRING",
|
|
@@ -34,12 +34,12 @@
|
|
|
34
34
|
"gateInReference": {
|
|
35
35
|
"type": "STRING",
|
|
36
36
|
"nullable": true,
|
|
37
|
-
"description": "A reference code for cargo entering the terminal to drop the loaded cargo for Export. Sometimes it can be '
|
|
37
|
+
"description": "A reference code for cargo entering the terminal to drop the loaded cargo for Export. Sometimes it can be 'Booking Number'."
|
|
38
38
|
},
|
|
39
39
|
"mblNumber": {
|
|
40
40
|
"type": "STRING",
|
|
41
41
|
"nullable": true,
|
|
42
|
-
"description": "Bill of Lading number (B/L NO.), a document issued by the carrier."
|
|
42
|
+
"description": "Master Bill of Lading number (B/L NO.), a document issued by the carrier. Commonly known as 'Bill of Lading Number', 'SEA WAYBILL', 'BILL OF LADING NO.', 'BL Number', 'BL No.', 'B/L No.', 'BL-Nr.', 'B/L', or 'HBL No.'"
|
|
43
43
|
},
|
|
44
44
|
"pickUpReference": {
|
|
45
45
|
"type": "STRING",
|
|
@@ -74,7 +74,7 @@
|
|
|
74
74
|
"dropOffDepotCode": {
|
|
75
75
|
"type": "STRING",
|
|
76
76
|
"nullable": true,
|
|
77
|
-
"description": "The depot code where the empty container will be dropped off."
|
|
77
|
+
"description": "The depot code where the empty container will be dropped off. Return Equip Delivery Terminal and Full Return Location is not the dropOffDepotCode."
|
|
78
78
|
}
|
|
79
79
|
}
|
|
80
80
|
},
|
|
@@ -139,7 +139,7 @@
|
|
|
139
139
|
"carrierName": {
|
|
140
140
|
"type": "STRING",
|
|
141
141
|
"nullable": true,
|
|
142
|
-
"description": "The name of the carrier who issued the document e,g, MAERSK."
|
|
142
|
+
"description": "The name of the carrier who issued the document. Extract the full name. e,g, MAERSK."
|
|
143
143
|
}
|
|
144
144
|
},
|
|
145
145
|
"required": ["bookingNumber", "transportLegs", "containers", "cyCutOff", "vgmCutOff", "siCutOff"]
|
|
@@ -24,18 +24,19 @@ For Import Shipment: The loaded container / cargo arrives at a port of discharge
|
|
|
24
24
|
- cyCutOff: The deadline for cargo to be delivered to the Container Yard. It can be referred to as Cargo Cut-off deadline, FCL delivery cut-off, CY CUT OFF, CY Closing - Latest Return Container Date.
|
|
25
25
|
- siCutOff: The deadline for submitting shipping instructions. It can be referred to as Shipping Instruction closing, SI Cut Off, Shipping Instruction deadline, INTENDED SI CUT-OFF
|
|
26
26
|
- vgmCutOff: The deadline for submitting the Verified Gross Mass of the cargo. It can be referred to as VGM cut-off, VGM Submission Deadline, Verified Gross Mass deadline
|
|
27
|
+
- Haulage Instructions Closing date in the second page is a cyCutOff but not siCutOff or vgmCutOff.
|
|
27
28
|
|
|
28
29
|
- carrierName and carrierAddress:
|
|
29
|
-
- Extract the name and address of the carrier who is the main parent company in the document.
|
|
30
|
+
- Extract the full name and address of the carrier who is the main parent company in the document.
|
|
30
31
|
- It can be found in the top section of the document, often near the logo or header.
|
|
31
32
|
- Example:
|
|
32
|
-
- "MAERSK" for carrierName
|
|
33
|
+
- "MAERSK" or "MAERSK Poland" for carrierName
|
|
33
34
|
- Hamburg, Germany, NETHERLANDS, Poland, Italy, Vietnam, China SHANGHAI BRANCH etc... for carrierAddress
|
|
34
35
|
|
|
35
36
|
- Containers: Need to extract Depot details per Container Type. Multiple Containers entries may exist, capture all instances under "Containers".
|
|
36
37
|
- containerType: The type of container (e.g., 20FT, 40FT, 20ft, 40ft, 40HC, 20DC, etc...).
|
|
37
38
|
- pickupDepotCode: The code of the depot where the empty container is picked up. Can be found as Empty Container Depot under Load Itinerary table.
|
|
38
|
-
- dropOffDepotCode: The code of the depot where the empty container is dropped off.
|
|
39
|
+
- dropOffDepotCode: The code of the depot where the empty container is dropped off. Return Equip Delivery Terminal and Full Return Location is not the dropOffDepotCode.
|
|
39
40
|
|
|
40
41
|
- transportLegs: Multiple Transport Legs entries may exist, capture all instances under "transportLegs". Make sure the order of the legs are important.
|
|
41
42
|
- eta: The estimated time of arrival for a specific leg.
|
|
@@ -9,7 +9,7 @@
|
|
|
9
9
|
"contractNumber": {
|
|
10
10
|
"type": "STRING",
|
|
11
11
|
"nullable": true,
|
|
12
|
-
"description": "It's a contract number between the carrier and Forto Logistics SE & Co KG. It can be found as Service Contract/Rate Reff. No."
|
|
12
|
+
"description": "It's a contract number between the carrier and Forto Logistics SE & Co KG. It can be found as Service Contract/Rate Reff. No. Shipment Id 'S' followed by 6, 7, or 8 digits e.g. S9486358 is not a contract number."
|
|
13
13
|
},
|
|
14
14
|
"pickUpTerminalCode": {
|
|
15
15
|
"type": "STRING",
|
|
@@ -21,10 +21,10 @@
|
|
|
21
21
|
"nullable": true,
|
|
22
22
|
"description": "The specific terminal where cargo is gated in especially Export terminal delivery address. It can be found as GATE IN AT TERMINAL/DEPOT"
|
|
23
23
|
},
|
|
24
|
-
"
|
|
24
|
+
"proformaDate": {
|
|
25
25
|
"type": "STRING",
|
|
26
26
|
"nullable": true,
|
|
27
|
-
"description": "The date considered to apply the rates and charges specified in the booking confirmation. It is mentioned as Price Calculation Date or
|
|
27
|
+
"description": "The date considered to apply the rates and charges specified in the booking confirmation. It is mentioned as Price Calculation Date or proforma Date."
|
|
28
28
|
},
|
|
29
29
|
"cyCutOff": {
|
|
30
30
|
"type": "STRING",
|
|
@@ -34,7 +34,7 @@
|
|
|
34
34
|
"gateInReference": {
|
|
35
35
|
"type": "STRING",
|
|
36
36
|
"nullable": true,
|
|
37
|
-
"description": "A reference code for cargo entering the terminal to drop the loaded cargo for Export. Sometimes it can be '
|
|
37
|
+
"description": "A reference code for cargo entering the terminal to drop the loaded cargo for Export. Sometimes it can be 'Booking Number'."
|
|
38
38
|
},
|
|
39
39
|
"mblNumber": {
|
|
40
40
|
"type": "STRING",
|
|
@@ -69,7 +69,7 @@
|
|
|
69
69
|
"pickUpDepotCode": {
|
|
70
70
|
"type": "STRING",
|
|
71
71
|
"nullable": true,
|
|
72
|
-
"description": "The depot code where the empty container will be picked up. It is identified as PICK UP AT DEPOT, Empty Container Depot, or Export Empty Pick Up Depot(s)."
|
|
72
|
+
"description": "The depot code where the empty container will be picked up. It is identified as PICK UP AT DEPOT, Empty Container Depot, or Export Empty Pick Up Depot(s). Do not extract the address here."
|
|
73
73
|
},
|
|
74
74
|
"dropOffDepotCode": {
|
|
75
75
|
"type": "STRING",
|
|
@@ -139,7 +139,7 @@
|
|
|
139
139
|
"carrierName": {
|
|
140
140
|
"type": "STRING",
|
|
141
141
|
"nullable": true,
|
|
142
|
-
"description": "The name of the carrier who issued the document e,g, MSC."
|
|
142
|
+
"description": "The name of the carrier who issued the document. Extract full name e,g, MSC or MSC POLAND SP. Z O.O. rather than just MSC."
|
|
143
143
|
}
|
|
144
144
|
},
|
|
145
145
|
"required": ["bookingNumber", "transportLegs", "containers", "cyCutOff", "vgmCutOff", "siCutOff"]
|
|
@@ -22,10 +22,10 @@ For Import Shipment: The loaded container / cargo arrives at a port of discharge
|
|
|
22
22
|
- cyCutOff: The deadline for cargo to be delivered to the Container Yard. It can be found at CUT-OFF(Date/Time), FCL delivery cut-off, CY CUT OFF, CY Closing.
|
|
23
23
|
|
|
24
24
|
- carrierName and carrierAddress:
|
|
25
|
-
- Extract the name and address of the carrier who is the main parent company in the document.
|
|
25
|
+
- Extract the full name and address of the carrier who is the main parent company in the document.
|
|
26
26
|
- It can be found in the top section of the document, often near the logo or header.
|
|
27
27
|
- Example:
|
|
28
|
-
- "MSC" for carrierName
|
|
28
|
+
- "MSC" or "MSC POLAND SP. Z O.O." for carrierName
|
|
29
29
|
- Hamburg, Germany, NETHERLANDS, Poland, Italy, Vietnam, China SHANGHAI BRANCH etc... for carrierAddress.
|
|
30
30
|
|
|
31
31
|
- Containers: Need to extract Depot details per Container Type. Multiple Containers entries may exist, capture all instances under "Containers".
|
|
@@ -9,7 +9,7 @@
|
|
|
9
9
|
"contractNumber": {
|
|
10
10
|
"type": "STRING",
|
|
11
11
|
"nullable": true,
|
|
12
|
-
"description": "It's a contract number between the carrier and Forto Logistics SE & Co KG. It can be referred as Rate Agreement Number or Contract No."
|
|
12
|
+
"description": "It's a contract number between the carrier and Forto Logistics SE & Co KG. It can be referred as Rate Agreement Number or Contract No.. Shipment Id 'S' followed by 6, 7, or 8 digits e.g. S9486358 is not a contract number."
|
|
13
13
|
},
|
|
14
14
|
"pickUpTerminalCode": {
|
|
15
15
|
"type": "STRING",
|
|
@@ -21,12 +21,7 @@
|
|
|
21
21
|
"nullable": true,
|
|
22
22
|
"description": "The specific terminal where cargo is gated in especially Export terminal delivery address. E.g., FULL RETURN LOCATION"
|
|
23
23
|
},
|
|
24
|
-
"
|
|
25
|
-
"type": "STRING",
|
|
26
|
-
"nullable": true,
|
|
27
|
-
"description": "The Shipping service code associated with the booking confirmation. It can be found as SERVICE CODE"
|
|
28
|
-
},
|
|
29
|
-
"performaDate": {
|
|
24
|
+
"proformaDate": {
|
|
30
25
|
"type": "STRING",
|
|
31
26
|
"nullable": true,
|
|
32
27
|
"description": "the date considered to apply the rates and charges specified in the booking confirmation"
|
|
@@ -114,6 +109,11 @@
|
|
|
114
109
|
"nullable": true,
|
|
115
110
|
"description": "The International Maritime Organization number for a specific leg. It can be found as IMO No, IMO number."
|
|
116
111
|
},
|
|
112
|
+
"serviceCode": {
|
|
113
|
+
"type": "STRING",
|
|
114
|
+
"nullable": true,
|
|
115
|
+
"description": "The Shipping service code associated with the booking confirmation. It can be found as SERVICE CODE"
|
|
116
|
+
},
|
|
117
117
|
"portOfDischarge": {
|
|
118
118
|
"type": "STRING",
|
|
119
119
|
"nullable": true,
|
|
@@ -153,7 +153,7 @@
|
|
|
153
153
|
"carrierName": {
|
|
154
154
|
"type": "STRING",
|
|
155
155
|
"nullable": true,
|
|
156
|
-
"description": "The name of the carrier who issued the document. E.g., OOCL or Orient Overseas Container Line Ltd."
|
|
156
|
+
"description": "The name of the carrier who issued the document. Extract the full name. E.g., OOCL or Orient Overseas Container Line Ltd."
|
|
157
157
|
}
|
|
158
158
|
},
|
|
159
159
|
"required": ["bookingNumber", "transportLegs", "containers", "cyCutOff", "vgmCutOff", "siCutOff"]
|
|
@@ -9,7 +9,7 @@
|
|
|
9
9
|
"contractNumber": {
|
|
10
10
|
"type": "STRING",
|
|
11
11
|
"nullable": true,
|
|
12
|
-
"description": "It's a contract number between the carrier and Forto Logistics SE & Co KG."
|
|
12
|
+
"description": "It's a contract number between the carrier and Forto Logistics SE & Co KG. Shipment Id 'S' followed by 6, 7, or 8 digits e.g. S9486358 is not a contract number."
|
|
13
13
|
},
|
|
14
14
|
"pickUpTerminalCode": {
|
|
15
15
|
"type": "STRING",
|
|
@@ -21,12 +21,7 @@
|
|
|
21
21
|
"nullable": true,
|
|
22
22
|
"description": "The specific terminal where cargo is gated in especially Export terminal delivery address. It can be found as Gate In At Terminal, Gate in Terminal, Full Return To Terminal, Full Return Location, Cargo Delivery At, Delivery Terminal, Full Return CY, eyc.."
|
|
23
23
|
},
|
|
24
|
-
"
|
|
25
|
-
"type": "STRING",
|
|
26
|
-
"nullable": true,
|
|
27
|
-
"description": "The Shipping service code associated with the booking confirmation. It is often referred to as 'Service Code'"
|
|
28
|
-
},
|
|
29
|
-
"performaDate": {
|
|
24
|
+
"proformaDate": {
|
|
30
25
|
"type": "STRING",
|
|
31
26
|
"nullable": true,
|
|
32
27
|
"description": "the date considered to apply the rates and charges specified in the booking confirmation"
|
|
@@ -44,12 +39,12 @@
|
|
|
44
39
|
"gateInReference": {
|
|
45
40
|
"type": "STRING",
|
|
46
41
|
"nullable": true,
|
|
47
|
-
"description": "A reference code for cargo entering the terminal to drop the loaded cargo for Export. Sometimes it can be load ref., Turn-in reference, or if nothing mentioned,
|
|
42
|
+
"description": "A reference code for cargo entering the terminal to drop the loaded cargo for Export. Sometimes it can be load ref., Turn-in reference, or if nothing mentioned, then use booking Number."
|
|
48
43
|
},
|
|
49
44
|
"mblNumber": {
|
|
50
45
|
"type": "STRING",
|
|
51
46
|
"nullable": true,
|
|
52
|
-
"description": "Bill of Lading number (B/L NO.), a document issued by the carrier."
|
|
47
|
+
"description": "Master Bill of Lading number (B/L NO.), a document issued by the carrier. Commonly known as 'Bill of Lading Number', 'SEA WAYBILL', 'BILL OF LADING NO.', 'BL Number', 'BL No.', 'B/L No.', 'BL-Nr.', 'B/L', or 'HBL No.'"
|
|
53
48
|
},
|
|
54
49
|
"pickUpReference": {
|
|
55
50
|
"type": "STRING",
|
|
@@ -114,6 +109,11 @@
|
|
|
114
109
|
"nullable": true,
|
|
115
110
|
"description": "The International Maritime Organization number for a specific leg. It can be found as IMO No, IMO number."
|
|
116
111
|
},
|
|
112
|
+
"serviceCode": {
|
|
113
|
+
"type": "STRING",
|
|
114
|
+
"nullable": true,
|
|
115
|
+
"description": "The Shipping service code associated with the booking confirmation. It is often referred to as 'Service Code'"
|
|
116
|
+
},
|
|
117
117
|
"portOfDischarge": {
|
|
118
118
|
"type": "STRING",
|
|
119
119
|
"nullable": true,
|
|
@@ -153,7 +153,7 @@
|
|
|
153
153
|
"carrierName": {
|
|
154
154
|
"type": "STRING",
|
|
155
155
|
"nullable": true,
|
|
156
|
-
"description": "The name of the carrier who issued the document. E.g,, Maersk, MSC, CMA CGM, Hapag-Lloyd, ONE, Evergreen etc."
|
|
156
|
+
"description": "The name of the carrier who issued the document. E.g,, Maersk, MSC, CMA CGM, Hapag-Lloyd, ONE, Evergreen etc. Sometimes, carriers like Shipco, Combitrac uses operating vessels from OOCL or Hapag-Lloyd, so in that case, the carrier name should be the one who issue the document (Shipco Transport (Shanghai) Ltd., Combitrac), not the operating vessel carrier (OOCL, Hapag-Lloyd)."
|
|
157
157
|
}
|
|
158
158
|
},
|
|
159
159
|
"required": ["bookingNumber", "transportLegs", "containers", "cyCutOff", "vgmCutOff", "siCutOff"]
|
|
@@ -29,8 +29,10 @@ For Import Shipment: The loaded container / cargo arrives at a port of discharge
|
|
|
29
29
|
|
|
30
30
|
- carrierName and carrierAddress:
|
|
31
31
|
- Extract the name and address of the carrier who is the main parent company in the document.
|
|
32
|
+
- Extract the complete name of the carrier including the entity location such as "Hapag-Lloyd Germany", "MSC Italy", "CMA CGM Vietnam" etc...
|
|
33
|
+
- Shipco Transport Ltd documents contain carrier: OOCL. Extract the carrier name "Other" but not OOCL.
|
|
32
34
|
- Example:
|
|
33
|
-
- "Hapag-Lloyd", "MSC", "CMA CGM", "ONE", "COSCO SHIPPING", "Evergreen", "Yang Ming", "ZIM", "PIL", "HMM" etc... for carrierName
|
|
35
|
+
- "Hapag-Lloyd", "MSC", "CMA CGM", "ONE", "Shipco Transport (Shanghai) Ltd.", "COSCO SHIPPING", "Evergreen", "Yang Ming", "ZIM", "PIL", "HMM" etc... for carrierName
|
|
34
36
|
- Hamburg, Germany, Poland, Italy, Vietnam, China etc... for carrierAddress
|
|
35
37
|
|
|
36
38
|
- Containers: Need to extract Depot details per Container Type. Multiple Containers entries may exist, capture all instances under "Containers".
|
|
@@ -9,7 +9,7 @@
|
|
|
9
9
|
"contractNumber": {
|
|
10
10
|
"type": "STRING",
|
|
11
11
|
"nullable": true,
|
|
12
|
-
"description": "It's a contract number between the carrier and Forto Logistics SE & Co KG.
|
|
12
|
+
"description": "It's a contract number between the carrier and Forto Logistics SE & Co KG. Shipment Id 'S' followed by 6, 7, or 8 digits e.g. S9486358 is not a contract number."
|
|
13
13
|
},
|
|
14
14
|
"pickUpTerminalCode": {
|
|
15
15
|
"type": "STRING",
|
|
@@ -21,12 +21,7 @@
|
|
|
21
21
|
"nullable": true,
|
|
22
22
|
"description": "The specific terminal where cargo is gated in especially Export terminal delivery address. It is mentioned as Delivery Terminal."
|
|
23
23
|
},
|
|
24
|
-
"
|
|
25
|
-
"type": "STRING",
|
|
26
|
-
"nullable": true,
|
|
27
|
-
"description": "The Shipping service code associated with the booking confirmation."
|
|
28
|
-
},
|
|
29
|
-
"performaDate": {
|
|
24
|
+
"proformaDate": {
|
|
30
25
|
"type": "STRING",
|
|
31
26
|
"nullable": true,
|
|
32
27
|
"description": "the date considered to apply the rates and charges specified in the booking confirmation"
|
|
@@ -114,6 +109,11 @@
|
|
|
114
109
|
"nullable": true,
|
|
115
110
|
"description": "The International Maritime Organization number for a specific leg. It can be found as IMO No, IMO number."
|
|
116
111
|
},
|
|
112
|
+
"serviceCode": {
|
|
113
|
+
"type": "STRING",
|
|
114
|
+
"nullable": true,
|
|
115
|
+
"description": "The Shipping service code associated with the booking confirmation. It is mentioned as SVC-NBR"
|
|
116
|
+
},
|
|
117
117
|
"portOfDischarge": {
|
|
118
118
|
"type": "STRING",
|
|
119
119
|
"nullable": true,
|
|
@@ -153,7 +153,7 @@
|
|
|
153
153
|
"carrierName": {
|
|
154
154
|
"type": "STRING",
|
|
155
155
|
"nullable": true,
|
|
156
|
-
"description": "The name of the carrier who issued the document."
|
|
156
|
+
"description": "The name of the carrier who issued the document. Extract full name. E.g., Yang Ming Marine Transport Corporation or Yang Ming Shipping EUROPE GmbH"
|
|
157
157
|
}
|
|
158
158
|
},
|
|
159
159
|
"required": ["bookingNumber", "transportLegs", "containers", "cyCutOff", "vgmCutOff", "siCutOff"]
|
|
@@ -31,7 +31,7 @@
|
|
|
31
31
|
},
|
|
32
32
|
"documentType": {"type": "STRING", "nullable": true},
|
|
33
33
|
"dueDate": {"type": "STRING", "nullable": true,
|
|
34
|
-
"description": "The date by which the payment should be made by Forto Logistics SE & Co KG.
|
|
34
|
+
"description": "The date by which the payment should be made by Forto Logistics SE & Co KG. If dueDate is not available in the invoice, calculate dueDate based on issueDate and paymentTerm."},
|
|
35
35
|
"eta": {"type": "STRING", "nullable": true,
|
|
36
36
|
"description": "Estimated Time of Arrival (ETA) is the expected date when the shipment will arrive at its destination."},
|
|
37
37
|
"etd": {"type": "STRING", "nullable": true,
|
|
@@ -46,7 +46,11 @@ Your role is to accurately extract specific entities from these invoices to supp
|
|
|
46
46
|
- CUSTOMS SUPPORT invoices do not have a vatAmount and vatPercentage.
|
|
47
47
|
|
|
48
48
|
- issueDate: The date the document was issued.
|
|
49
|
-
- dueDate:
|
|
49
|
+
- dueDate:
|
|
50
|
+
- The date by which the payment should be made. If dueDate is explicitly mentioned in the invoice, extract that value directly.
|
|
51
|
+
- If dueDate is not available in the invoice, calculate dueDate based on issueDate and paymentTerm.
|
|
52
|
+
- Example: If issueDate is 01.03.2023 and paymentTerm is 30 days, then dueDate will be 31.03.2023.
|
|
53
|
+
- If paymentTerm is not available, do not extract dueDate.
|
|
50
54
|
|
|
51
55
|
- lineItem: Details of each COGS and Customs line item on the invoice from each page. Make sure to extract each amount and currency separately.
|
|
52
56
|
- uniqueId: A unique id which associated with the lineItem as each line item can belong to a different shipment. Extract only if its available in the line item. Either a shipmentId starting with an S and followed by 6 or 8 numeric values or a mblNumber. If shipmentId or mblNumber does not exist, set it to containerNumber.
|
|
@@ -91,7 +95,7 @@ Your role is to accurately extract specific entities from these invoices to supp
|
|
|
91
95
|
- sentence: A sentence from the invoice indicating the payment status (e.g., "Vorschuss", "Prepayment", "Paid", "Partially Paid", "Unpaid"). This helps summarize the overall payment status of the invoice.
|
|
92
96
|
|
|
93
97
|
IMPORTANT NOTE:
|
|
94
|
-
- Ensure all extracted values are directly from the document. Do not make assumptions or
|
|
98
|
+
- Ensure all extracted values are directly from the document. Do not make assumptions, modifications or calculations except dueDate.
|
|
95
99
|
- CustomSized invoices contain line items in a table format in a attached page. Table with headings Shipment ID, Partner Line Item Description, Quantity, Amount, and VAT. Extract all the line items from each tables from each page.
|
|
96
100
|
- Do not normalize or modify any entity values.
|
|
97
101
|
- Pay attention to the line item details and paymentInformation, as they may vary significantly across different invoices.
|
|
@@ -29,7 +29,7 @@
|
|
|
29
29
|
},
|
|
30
30
|
"documentType": {"type": "STRING", "nullable": true},
|
|
31
31
|
"dueDate": {"type": "STRING", "nullable": true,
|
|
32
|
-
"description": "The date by which the payment should be made by Forto Logistics SE & Co KG.
|
|
32
|
+
"description": "The date by which the payment should be made by Forto Logistics SE & Co KG. If dueDate is not available in the invoice, calculate dueDate based on issueDate and paymentTerm."},
|
|
33
33
|
"eta": {"type": "STRING", "nullable": true,
|
|
34
34
|
"description": "Estimated Time of Arrival (ETA) is the expected date when the shipment will arrive at its destination."},
|
|
35
35
|
"etd": {"type": "STRING", "nullable": true,
|
|
@@ -42,7 +42,11 @@ Your role is to accurately extract specific entities from these invoices to supp
|
|
|
42
42
|
- Remove "TVA" characters from VAT ID in MSC invoices. For example, CHE-111.954.803 TVA should be extracted as CHE-111.954.803
|
|
43
43
|
|
|
44
44
|
- issueDate: The date the document was issued.
|
|
45
|
-
- dueDate:
|
|
45
|
+
- dueDate:
|
|
46
|
+
- The date by which the payment should be made. If dueDate is explicitly mentioned in the invoice, extract that value directly.
|
|
47
|
+
- If dueDate is not available in the invoice, calculate dueDate based on issueDate and paymentTerm.
|
|
48
|
+
- Example: If issueDate is 01.03.2023 and paymentTerm is 30 days, then dueDate will be 31.03.2023.
|
|
49
|
+
- If paymentTerm is not available, do not extract dueDate.
|
|
46
50
|
|
|
47
51
|
- eta and etd: Few invoices contains same date for ARRIVED/DEPARTED or ETA/ETD. Extract it for both eta and etd.
|
|
48
52
|
|
|
@@ -81,7 +85,7 @@ Your role is to accurately extract specific entities from these invoices to supp
|
|
|
81
85
|
- reverseChargeSentence: A sentence which indicate that the reverse charge applies. Mostly fund as Tax Clause.
|
|
82
86
|
|
|
83
87
|
IMPORTANT NOTE:
|
|
84
|
-
- Ensure all extracted values are directly from the document. Do not make assumptions, modifications or calculations.
|
|
88
|
+
- Ensure all extracted values are directly from the document. Do not make assumptions, modifications or calculations except dueDate.
|
|
85
89
|
- CustomSized invoices contain line items in a table format in the attached page. Table with headings Shipment ID, Partner Line Item Description, Quantity, Amount, and VAT. Extract all the line items from such tables from each page.
|
|
86
90
|
- Do not split the quantity into different line items. e.g., if quantity is 2 or 2 CTR or 2 BIL, do not create 2 separate line items with quantity 1 each.
|
|
87
91
|
- Do not normalize or modify any entity values.
|
|
@@ -0,0 +1,5 @@
|
|
|
1
|
+
You are a person who works for a freight-forwarder company.
|
|
2
|
+
Identify company that provided this DOCUMENT_TYPE_PLACEHOLDER document.
|
|
3
|
+
|
|
4
|
+
Identify the company only based on the name of the carrier mentioned in the top section of the document in the header, title.
|
|
5
|
+
Extract only if the carrier name is mentioned in the top header of the document. Else, classifiy it as "Other" because few carriers use a different carrier for shipping even though the document is issued by them.
|
|
File without changes
|
{data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/constants_sandbox.py
RENAMED
|
File without changes
|
|
File without changes
|
{data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/docai_processor_config.yaml
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/postprocessing/common.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{data_science_document_ai-1.59.0 → data_science_document_ai-1.60.1}/src/prompts/prompt_library.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|