Description
Hi, I am receiving data in the format below in a JSON file.
Could you please help me extract the following information from the data below?
------------------------------- JSON --------------------------------------------
{
“document”: {
“pages”: [
{
“pageNumber”: 1
}
],
“entities”: [
{
“textAnchor”: {
“textSegments”: [
{
“startIndex”: “247”,
“endIndex”: “256”
}
],
“content”: “30-Apr-24”
},
“type”: “invoice_date”,
“mentionText”: “30-Apr-24”,
“confidence”: 0.96529007,
“pageAnchor”: {
“pageRefs”: [
{
“boundingPoly”: {
“normalizedVertices”: [
{
“x”: 0.76442593,
“y”: 0.21404542
},
{
“x”: 0.82331944,
“y”: 0.21404542
},
{
“x”: 0.82331944,
“y”: 0.22750211
},
{
“x”: 0.76442593,
“y”: 0.22750211
}
]
}
}
]
},
“id”: “0”,
“normalizedValue”: {
“text”: “2024-04-30”,
“dateValue”: {
“year”: 2024,
“month”: 4,
“day”: 30
}
}
},
{
“textAnchor”: {
“textSegments”: [
{
“startIndex”: “1834”,
“endIndex”: “1843”
}
],
“content”: “16,110.00”
},
“type”: “total_amount”,
“mentionText”: “16,110.00”,
“confidence”: 0.94710624,
“pageAnchor”: {
“pageRefs”: [
{
“boundingPoly”: {
“normalizedVertices”: [
{
“x”: 0.8441404,
“y”: 0.764508
},
{
“x”: 0.9411065,
“y”: 0.764508
},
{
“x”: 0.9411065,
“y”: 0.7804878
},
{
“x”: 0.8441404,
“y”: 0.7804878
}
]
}
}
]
},
“id”: “1”,
“normalizedValue”: {
“text”: “16110”
}
},
{
“textAnchor”: {
“textSegments”: [
{
“startIndex”: “1890”,
“endIndex”: “1899”
}
],
“content”: “29-Jun-24”
},
“type”: “due_date”,
“mentionText”: “29-Jun-24”,
“confidence”: 0.9443872,
“pageAnchor”: {
“pageRefs”: [
{
“boundingPoly”: {
“normalizedVertices”: [
{
“x”: 0.8839976,
“y”: 0.8061396
},
{
“x”: 0.94170135,
“y”: 0.8061396
},
{
“x”: 0.94170135,
“y”: 0.8179142
},
{
“x”: 0.8839976,
“y”: 0.8179142
}
]
}
}
]
},
“id”: “2”,
“normalizedValue”: {
“text”: “2024-06-29”,
“dateValue”: {
“year”: 2024,
“month”: 6,
“day”: 29
}
}
},
{
“textAnchor”: {
“textSegments”: [
{
“startIndex”: “145”,
“endIndex”: “154”
}
],
“content”: “S01894912”
},
“type”: “invoice_id”,
“mentionText”: “S01894912”,
“confidence”: 0.92988557,
“pageAnchor”: {
“pageRefs”: [
{
“boundingPoly”: {
“normalizedVertices”: [
{
“x”: 0.20880428,
“y”: 0.17325483
},
{
“x”: 0.37834623,
“y”: 0.17325483
},
{
“x”: 0.37834623,
“y”: 0.19512194
},
{
“x”: 0.20880428,
“y”: 0.19512194
}
]
}
}
]
},
“id”: “3”
},
{
“textAnchor”: {
“textSegments”: [
{
“startIndex”: “1291”,
“endIndex”: “1300”
}
],
“content”: “16,110.00”
},
“type”: “net_amount”,
“mentionText”: “16,110.00”,
“confidence”: 0.92172015,
“pageAnchor”: {
“pageRefs”: [
{
“boundingPoly”: {
“normalizedVertices”: [
{
“x”: 0.86079717,
“y”: 0.73044574
},
{
“x”: 0.93991673,
“y”: 0.73044574
},
{
“x”: 0.93991673,
“y”: 0.74432296
},
{
“x”: 0.86079717,
“y”: 0.74432296
}
]
}
}
]
},
“id”: “4”,
“normalizedValue”: {
“text”: “16110”
}
},
{
“textAnchor”: {
“textSegments”: [
{
“startIndex”: “1830”,
“endIndex”: “1833”
}
],
“content”: “USD”
},
“type”: “currency”,
“mentionText”: “USD”,
“confidence”: 0.8704995,
“pageAnchor”: {
“pageRefs”: [
{
“boundingPoly”: {
“normalizedVertices”: [
{
“x”: 0.6954194,
“y”: 0.76576954
},
{
“x”: 0.7209994,
“y”: 0.76576954
},
{
“x”: 0.7209994,
“y”: 0.7783852
},
{
“x”: 0.6954194,
“y”: 0.7783852
}
]
}
}
]
},
“id”: “5”,
“normalizedValue”: {
“text”: “USD”
}
},
{
“textAnchor”: {
“textSegments”: [
{
“startIndex”: “340”,
“endIndex”: “362”
}
],
“content”: “60 days from Inv. Date”
},
“type”: “payment_terms”,
“mentionText”: “60 days from Inv. Date”,
“confidence”: 0.7146772,
“pageAnchor”: {
“pageRefs”: [
{
“boundingPoly”: {
“normalizedVertices”: [
{
“x”: 0.7638311,
“y”: 0.29394448
},
{
“x”: 0.89827484,
“y”: 0.29394448
},
{
“x”: 0.89827484,
“y”: 0.30824223
},
{
“x”: 0.7638311,
“y”: 0.30824223
}
]
}
}
]
},
“id”: “6”
},
{
“textAnchor”: {
“textSegments”: [
{
“startIndex”: “96”,
“endIndex”: “116”
}
],
“content”: “.com”
},
“type”: “supplier_website”,
“mentionText”: “e.com”,
“confidence”: 0.6468903,
“pageAnchor”: {
“pageRefs”: [
{
“boundingPoly”: {
“normalizedVertices”: [
{
“x”: 0.56157047,
“y”: 0.1312027
},
{
“x”: 0.7430101,
“y”: 0.1312027
},
{
“x”: 0.7430101,
“y”: 0.14550042
},
{
“x”: 0.56157047,
“y”: 0.14550042
}
]
}
}
]
},
“id”: “7”
},
{
“textAnchor”: {
“textSegments”: [
{
“startIndex”: “3”,
“endIndex”: “26”
}
],
“content”: “INDIA WIDE LOGISTICS”
},
“type”: “supplier_name”,
“mentionText”: “INDIA WIDE LOGISTICS”,
“confidence”: 0.6138423,
“pageAnchor”: {
“pageRefs”: [
{
“boundingPoly”: {
“normalizedVertices”: [
{
“x”: 0.56632954,
“y”: 0.042472664
},
{
“x”: 0.78167754,
“y”: 0.042472664
},
{
“x”: 0.78167754,
“y”: 0.058873
},
{
“x”: 0.56632954,
“y”: 0.058873
}
]
}
}
]
},
“id”: “8”,
“normalizedValue”: {
“text”: “istics”
}
},
{
“textAnchor”: {
“textSegments”: [
{
“startIndex”: “27”,
“endIndex”: “70”
}
],
“content”: “7\nUSA”
},
“type”: “supplier_address”,
“mentionText”: “7\nUSA”,
“confidence”: 0.5933487,
“pageAnchor”: {
“pageRefs”: [
{
“boundingPoly”: {
“normalizedVertices”: [
{
“x”: 0.56276023,
“y”: 0.058873
},
{
“x”: 0.7447948,
“y”: 0.058873
},
{
“x”: 0.7447948,
“y”: 0.10639193
},
{
“x”: 0.56276023,
“y”: 0.10639193
}
]
}
}
]
},
“id”: “9”,
“normalizedValue”: {
“text”: " USA",
“addressValue”: {
“regionCode”: “US”,
“languageCode”: “en-US”,
“postalCode”: “”,
“administrativeArea”: “Illois”,
“locality”: “Palatine”,
“addressLines”: [
“d”
]
}
}
},
{
“textAnchor”: {
“textSegments”: [
{
“startIndex”: “78”,
“endIndex”: “95”
}
],
“content”: “11”
},
“type”: “supplier_phone”,
“mentionText”: “11”,
“confidence”: 0.59013975,
“pageAnchor”: {
“pageRefs”: [
{
“boundingPoly”: {
“normalizedVertices”: [
{
“x”: 0.6323617,
“y”: 0.10933558
},
{
“x”: 0.7662106,
“y”: 0.10933558
},
{
“x”: 0.7662106,
“y”: 0.12657696
},
{
“x”: 0.6323617,
“y”: 0.12657696
}
]
}
}
]
},
“id”: “10”,
“normalizedValue”: {
“text”: “66 0711”
}
},
{
“textAnchor”: {
“textSegments”: [
{
“startIndex”: “684”,
“endIndex”: “700”
}
],
“content”: “0003001003-00150”
},
“type”: “purchase_order”,
“mentionText”: “0003001003-00150”,
“confidence”: 0.5397213,
“pageAnchor”: {
“pageRefs”: [
{
“boundingPoly”: {
“normalizedVertices”: [
{
“x”: 0.215348,
“y”: 0.490328
},
{
“x”: 0.33372992,
“y”: 0.490328
},
{
“x”: 0.33372992,
“y”: 0.50546676
},
{
“x”: 0.215348,
“y”: 0.50546676
}
]
}
}
]
},
“id”: “11”
},
{
“textAnchor”: {
“textSegments”: [
{
“startIndex”: “2087”,
“endIndex”: “2136”
}
],
“content”: “PONITED STATES”
},
“type”: “remit_to_address”,
“mentionText”: “PO nUNITED STATES”,
“confidence”: 0.44959384,
“pageAnchor”: {
“pageRefs”: [
{
“boundingPoly”: {
“normalizedVertices”: [
{
“x”: 0.50386673,
“y”: 0.84020185
},
{
“x”: 0.6561571,
“y”: 0.84020185
},
{
“x”: 0.6561571,
“y”: 0.8713204
},
{
“x”: 0.50386673,
“y”: 0.8713204
}
]
}
}
]
},
“id”: “12”
},
{
“type”: “invoice_type”,
“confidence”: 0.3908778,
“pageAnchor”: {
“pageRefs”: [
{}
]
},
“id”: “13”,
“normalizedValue”: {
“text”: “invoice_statement”
}
},
{
“textAnchor”: {
“textSegments”: [
{
“startIndex”: “2057”,
“endIndex”: “2086”
}
],
“content”: " LOGISTICS, INC."
},
“type”: “remit_to_name”,
“mentionText”: " LOGISTICS, INC.",
“confidence”: 0.20493957,
“pageAnchor”: {
“pageRefs”: [
{
“boundingPoly”: {
“normalizedVertices”: [
{
“x”: 0.50743604,
“y”: 0.8292683
},
{
“x”: 0.72635335,
“y”: 0.8292683
},
{
“x”: 0.72635335,
“y”: 0.842725
},
{
“x”: 0.50743604,
“y”: 0.842725
}
]
}
}
]
},
“id”: “14”
},
{
“textAnchor”: {
“textSegments”: [
{
“startIndex”: “1856”,
“endIndex”: “1866”
}
],
“content”: “WHIRLPSXX1”
},
“type”: “supplier_tax_id”,
“mentionText”: “WHISXX1”,
“confidence”: 0.152821,
“pageAnchor”: {
“pageRefs”: [
{
“boundingPoly”: {
“normalizedVertices”: [
{
“x”: 0.20464009,
“y”: 0.79268295
},
{
“x”: 0.29625222,
“y”: 0.79268295
},
{
“x”: 0.29625222,
“y”: 0.8061396
},
{
“x”: 0.20464009,
“y”: 0.8061396
}
]
}
}
]
},
“id”: “15”
},
{
“textAnchor”: {
“textSegments”: [
{
“startIndex”: “1083”,
“endIndex”: “1114”
}
],
“content”: “ABCEE = Columbus, United States”
},
“type”: “ship_to_address”,
“mentionText”: “ABCDE = Columbus, United States”,
“confidence”: 0.08760377,
“pageAnchor”: {
“pageRefs”: [
{
“boundingPoly”: {
“normalizedVertices”: [
{
“x”: 0.50386673,
“y”: 0.57611436
},
{
“x”: 0.71802497,
“y”: 0.57611436
},
{
“x”: 0.71802497,
“y”: 0.58915055
},
{
“x”: 0.50386673,
“y”: 0.58915055
}
]
}
}
]
},
“id”: “16”
},
{
“textAnchor”: {
“textSegments”: [
{
“startIndex”: “1206”,
“endIndex”: “1271”
},
{
“startIndex”: “1272”,
“endIndex”: “1281”
}
]
},
“type”: “line_item”,
“mentionText”: " 16,110.00",
“confidence”: 1,
“pageAnchor”: {
“pageRefs”: [
{
“boundingPoly”: {
“normalizedVertices”: [
{
“x”: 0.0594884,
“y”: 0.65937763
},
{
“x”: 0.9405116,
“y”: 0.65937763
},
{
“x”: 0.9405116,
“y”: 0.67535746
},
{
“x”: 0.0594884,
“y”: 0.67535746
}
]
}
}
]
},
“id”: “17”,
“properties”: [
{
“textAnchor”: {
“textSegments”: [
{
“startIndex”: “1206”,
“endIndex”: “1271”
}
],
“content”: “0’ CONTAINER @ $8,055”
},
“type”: “line_item/description”,
“mentionText”: " 40’ CONTAINER @ $8,055",
“confidence”: 0.6885872,
“pageAnchor”: {
“pageRefs”: [
{
“boundingPoly”: {
“normalizedVertices”: [
{
“x”: 0.0594884,
“y”: 0.65937763
},
{
“x”: 0.6508031,
“y”: 0.65937763
},
{
“x”: 0.6508031,
“y”: 0.67535746
},
{
“x”: 0.0594884,
“y”: 0.67535746
}
]
}
}
]
},
“id”: “18”
},
{
“textAnchor”: {
“textSegments”: [
{
“startIndex”: “1272”,
“endIndex”: “1281”
}
],
“content”: “16,110.00”
},
“type”: “line_item/amount”,
“mentionText”: “16,110.00”,
“confidence”: 0.8672323,
“pageAnchor”: {
“pageRefs”: [
{
“boundingPoly”: {
“normalizedVertices”: [
{
“x”: 0.86020225,
“y”: 0.65979815
},
{
“x”: 0.9405116,
“y”: 0.65979815
},
{
“x”: 0.9405116,
“y”: 0.67283434
},
{
“x”: 0.86020225,
“y”: 0.67283434
}
]
}
}
]
},
“id”: “19”,
“normalizedValue”: {
“text”: “16110”
}
}
]
}
]
},
“humanReviewStatus”: {
“state”: “SKIPPED”
}
}
I want to extract the data associated with the following fields:
1. invoice_id
2. invoice_date
3. ship_from_name
4. ship_to_address
5. total_amount
6. supplier_name
Kindly suggest how to do this.
Link
Date
2025-03-17
Related UiPath products
Studio