File size: 2,196 Bytes
fd206e2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
{
  "$schema": "https://json-schema.org/draft/2020-12/schema",
  "$id": "german-ocr-3/schemas/form.json",
  "title": "GermanOCR3 Form (Formular)",
  "description": "Generisches Schema fuer ausgefuellte deutsche Formulare. Felder werden als Liste von Label/Value-Paaren geliefert, plus optionale Checkbox-Liste und Unterschriften.",
  "type": "object",
  "additionalProperties": false,
  "required": ["document_type", "language", "fields"],
  "properties": {
    "document_type": {
      "const": "form"
    },
    "language": {
      "type": "string",
      "default": "de"
    },
    "form_title": {
      "type": ["string", "null"]
    },
    "form_id": {
      "type": ["string", "null"],
      "description": "z.B. Antragsnummer / Formularkennung"
    },
    "issuing_authority": {
      "type": ["string", "null"]
    },

    "fields": {
      "type": "array",
      "description": "Erkannte Label/Wert-Paare in Lesereihenfolge.",
      "items": {
        "type": "object",
        "additionalProperties": false,
        "required": ["label", "value"],
        "properties": {
          "label": {
            "type": "string"
          },
          "value": {
            "type": ["string", "number", "boolean", "null"]
          },
          "section": {
            "type": ["string", "null"]
          },
          "page": {
            "type": ["integer", "null"]
          }
        }
      }
    },

    "checkboxes": {
      "type": "array",
      "default": [],
      "items": {
        "type": "object",
        "additionalProperties": false,
        "required": ["label", "checked"],
        "properties": {
          "label": {
            "type": "string"
          },
          "checked": {
            "type": "boolean"
          },
          "section": {
            "type": ["string", "null"]
          }
        }
      }
    },

    "signatures": {
      "type": "array",
      "default": [],
      "items": {
        "type": "object",
        "additionalProperties": false,
        "properties": {
          "by": {
            "type": ["string", "null"]
          },
          "place": {
            "type": ["string", "null"]
          },
          "date": {
            "type": ["string", "null"]
          },
          "present": {
            "type": "boolean"
          }
        }
      }
    },

    "raw_text": {
      "type": ["string", "null"]
    },
    "confidence": {
      "type": ["number", "null"],
      "minimum": 0,
      "maximum": 1
    },
    "notes": {
      "type": "array",
      "items": {
        "type": "string"
      },
      "default": []
    }
  }
}