{
  "$schema": "https://json-schema.org/draft/2020-12/schema",
  "title": "Token-level POS, lemma and morphology annotation",
  "description": "Annotation record for a single sentence: an identifier, a language, and one entry per token carrying its lemma, part-of-speech tag and morphological features.",
  "type": "object",
  "required": ["sentence_id", "language", "tokens"],
  "additionalProperties": false,
  "properties": {
    "sentence_id": {
      "description": "Identifier of the annotated sentence.",
      "type": "string"
    },
    "language": {
      "description": "Language of the sentence. Any string is accepted; this schema does not enforce a particular code format.",
      "type": "string"
    },
    "tokens": {
      "description": "The annotated tokens of the sentence, one object per token.",
      "type": "array",
      "items": {
        "description": "A single annotated token. All six keys must be present; lemma and comment may be null.",
        "type": "object",
        "required": ["surface", "lemma", "upos", "features", "confidence", "comment"],
        "additionalProperties": false,
        "properties": {
          "surface": {
            "description": "Surface form of the token.",
            "type": "string"
          },
          "lemma": {
            "description": "Lemma of the token, or null when no lemma is given.",
            "type": ["string", "null"]
          },
          "upos": {
            "description": "Part-of-speech tag. The allowed values are the 17 Universal Dependencies universal POS (UPOS) tags.",
            "type": "string",
            "enum": [
              "ADJ",
              "ADP",
              "ADV",
              "AUX",
              "CCONJ",
              "DET",
              "INTJ",
              "NOUN",
              "NUM",
              "PART",
              "PRON",
              "PROPN",
              "PUNCT",
              "SCONJ",
              "SYM",
              "VERB",
              "X"
            ]
          },
          "features": {
            "description": "Morphological features of the token. Every key is optional and may also be null; keys other than the ones listed here are rejected. Values are free-form strings that this schema does not enumerate.",
            "type": "object",
            "additionalProperties": false,
            "properties": {
              "Case": { "type": ["string", "null"] },
              "Number": { "type": ["string", "null"] },
              "Gender": { "type": ["string", "null"] },
              "Person": { "type": ["string", "null"] },
              "Tense": { "type": ["string", "null"] },
              "Mood": { "type": ["string", "null"] },
              "Voice": { "type": ["string", "null"] }
            }
          },
          "confidence": {
            "description": "Confidence level attached to this token's annotation: low, medium or high.",
            "type": "string",
            "enum": ["low", "medium", "high"]
          },
          "comment": {
            "description": "Free-text comment on the token, or null when there is none.",
            "type": ["string", "null"]
          }
        }
      }
    }
  }
}