Sample JSON template: IDDPTemplate_v3_1_tr.json
{
"DocumentTypeId": "Direct Order Form",
"TemplateID": "directorder1",
"Page": [
{
"PageID": "1",
"StartReg": "",
"EndReg": "",
"Fields": [
{
"FieldName": "Entity_Name",
"Type": "Text",
"ExtractionParser": [
{
"Type": "REExtractor",
"PaserInput": {
"regtext": "Agreement between ([\\s\\S]*?) and [\\s\\S]*? \\(\"Licensee\"\\)"
}
}
]
},
{
"FieldName": "Document Name",
"Type": "Text",
"ExtractionParser": [
{
"Type": "ROIExtractor",
"PaserInput": {
"Height": 0.0092,
"Width": 0.0781,
"Top": 0.1020,
"Left": 0.4605
}
}
]
}
],
"Tables": [
{
"TableName": "ComponentSystems1",
"ExtractionParserType": {
"Type": "TableREExtractor",
"PaserInput": {
"StartRegEx": "PROD",
"EndRegEx": "TEST",
"HasHeader": false,
"RowReg": "(\\d+)\\s+((?:[A-Z0-9]+-[A-Z0-9-]*))\\s+([\\S ]+)\\s+(\\d+)\\s+(\\w+)\\s+(\\w+)",
"ColumnConfiguration": [
{
"ColumnNumber": 1,
"ColumnName": "ID",
"RegEx": "\\d+[.?]*"
},
{
"ColumnNumber": 2,
"ColumnName": "Part",
"RegEx": "(?:[A-Z0-9]+-[A-Z0-9-]*)",
"Multiline": true
},
{
"ColumnNumber": 3,
"ColumnName": "Component_Systems",
"RegEx": "[\\S ]+",
"Multiline": false
},
{
"ColumnNumber": 4,
"ColumnName": "Quantity",
"RegEx": "\\d+"
},
{
"ColumnNumber": 5,
"ColumnName": "Type",
"RegEx": "\\w+"
},
{
"ColumnNumber": 6,
"ColumnName": "Support_Level",
"RegEx": "\\w+"
}
]
}
}
},
{
"TableName": "ENV",
"ExtractionParserType": {
"Type": "TableREExtractor",
"PaserInput": {
"StartRegEx": "*",
"EndRegEx": "*",
"HasHeader": true,
"RowReg": "*",
"ColumnConfiguration": "*"
}
}
},
{
"TableName": "TESTTAB",
"ExtractionParserType": {
"Type": "TableROIExtractor",
"PaserInput": {
"Geometry": [0.08294117647058824, 0.7781818181818182, 0.8635294117647059, 0.14454545454545453],
"HasHeader": true,
"ColumnConfiguration": [
{
"ColumnName": "Part",
"Box": [0.13, 0.7822727272727272, 0.14705882352941174, 0.13454545454545463],
"Type": "",
"RegEx": "(.*?)-.*"
},
{
"ColumnName": "Component Systems",
"Box": [0.2817647058823529, 0.7859090909090909, 0.38, 0.13318181818181818],
"Type": "",
"RegEx": "(\\w+)"
},
{
"ColumnName": "Quantity",
"Box": [0.6611764705882353, 0.7804545454545454, 0.10294117647058831, 0.13818181818181818],
"Type": ""
},
{
"ColumnName": "Type",
"Box": [0.7664705882352941, 0.7868181818181819, 0.06294117647058828, 0.13],
"Type": ""
},
{
"ColumnName": "Support Level",
"Box": [0.8276470588235294, 0.785, 0.11529411764705888, 0.13681818181818184],
"Type": ""
}
]
}
}
},
{
"TableName": "Equipment",
"ExtractionParserType": {
"Type": "KeyValueTableREExtractor",
"PaserInput": {
"Geometry": [0.09588235294117647, 0.10181818181818182, 0.53, 0.06999999999999999]
}
}
}
]
}
],
"StaticData": {
"Issue": "Some static that needs to return",
"DocumentType": "Order Form"
},
"Options": {
"Date Format": "mm-dd-yyyy",
"DecimalSeparator": "."
},
"Keywords": "List of comma seperated keywords.These are\tused to\tpick thecorrect template, we can extend it with Regular Expression ",
"ExcludeKeywords": "List of comma seperated keywords,These are used to exclude document,we can extend it with Regular Expression",
"ConfidenceScore": 90.00
}