# blob: 24a7fc2b1d456d1c82ac228dc4585db96d6b0a92 (repository-viewer header line; not part of the mapping definition)
# Metadata for this mapping list. Per the description below, the file relates
# STTS part-of-speech tags to Universal Dependencies part-of-speech (UPoS) tags.
id: stts-upos
desc: Mapping between STTS and Universal dependency Part-of-Speech
# Foundry/layer pair for side A.
# NOTE(review): presumably side A is the left-hand (STTS) pattern of every
# "<>" rule in `mappings` -- confirm against the loader.
foundryA: opennlp
layerA: p
# Foundry/layer pair for side B.
# NOTE(review): presumably side B is the right-hand (UPoS) pattern of every
# "<>" rule in `mappings` -- confirm against the loader.
foundryB: upos
layerB: p
# Rule list. Every entry is a quoted string of the form
#   "[A-pattern] <> [B-pattern]"
# In the entries of this section the A-pattern is a single STTS tag and the
# B-pattern is one UPoS tag, optionally narrowed with "&"-joined Key=Value
# features; "|" inside parentheses lists alternative feature values.
# Entries are kept in alphabetical order of the STTS tag.
mappings:
# --- Punctuation -> PUNCT ---
# "\\" in a double-quoted YAML scalar yields a single literal backslash, so the
# rule text seen by the consumer is [$\(].
# NOTE(review): presumably the backslash escapes "(" for the rule parser -- confirm.
- "[$\\(] <> [PUNCT & PunctType=Brck]"
- "[$,] <> [PUNCT & PunctType=Comm]"
- "[$.] <> [PUNCT & PunctType=Peri]"
# --- Adjectives and adverbs ---
- "[ADJA] <> [ADJ]"
- "[ADJD] <> [ADJ & Variant=Short]"
- "[ADV] <> [ADV]"
# --- Adpositions -> ADP, distinguished by AdpType ---
- "[APPO] <> [ADP & AdpType=Post]"
- "[APPR] <> [ADP & AdpType=Prep]"
- "[APPRART] <> [ADP & AdpType=Prep & PronType=Art]"
- "[APZR] <> [ADP & AdpType=Circ]"
# --- Article, cardinal number, foreign material, interjection ---
- "[ART] <> [DET & PronType=Art]"
- "[CARD] <> [NUM & NumType=Card]"
- "[FM] <> [X & Foreign=Yes]"
- "[ITJ] <> [INTJ]"
# --- Conjunctions ---
- "[KOKOM] <> [CCONJ & ConjType=Comp]"
- "[KON] <> [CCONJ]"
# KOUI and KOUS share the same right-hand pattern, so they cannot be told
# apart on the UPoS side.
- "[KOUI] <> [SCONJ]"
- "[KOUS] <> [SCONJ]"
# --- Nouns ---
- "[NE] <> [PROPN]"
- "[NN] <> [NOUN]"
# --- P* tags -> ADV / DET / PRON, distinguished by PronType (plus Poss, Reflex, AdjType) ---
- "[PAV] <> [ADV & PronType=Dem]"
- "[PDAT] <> [DET & PronType=Dem]"
- "[PDS] <> [PRON & PronType=Dem]"
- "[PIAT] <> [DET & (PronType=Ind | PronType=Neg | PronType=Tot)]"
- "[PIDAT] <> [DET & AdjType=Pdt & (PronType=Ind | PronType=Neg | PronType=Tot)]"
- "[PIS] <> [PRON & (PronType=Ind | PronType=Neg | PronType=Tot)]"
- "[PPER] <> [PRON & PronType=Prs]"
- "[PPOSAT] <> [DET & Poss=Yes & PronType=Prs]"
- "[PPOSS] <> [PRON & Poss=Yes & PronType=Prs]"
- "[PRELAT] <> [DET & PronType=Rel]"
- "[PRELS] <> [PRON & PronType=Rel]"
- "[PRF] <> [PRON & PronType=Prs & Reflex=Yes]"
# --- PTK* tags (particles) ---
- "[PTKA] <> [PART]"
- "[PTKANT] <> [PART & PartType=Res]"
- "[PTKNEG] <> [PART & Polarity=Neg]"
# PTKVZ is the only PTK* tag mapped to ADP instead of PART; the bare [ADP]
# fallback rule later in this list includes it accordingly.
- "[PTKVZ] <> [ADP & PartType=Vbp]"
- "[PTKZU] <> [PART & PartType=Inf]"
# --- PW* tags -> PronType=Int ---
- "[PWAT] <> [DET & PronType=Int]"
- "[PWAV] <> [ADV & PronType=Int]"
- "[PWS] <> [PRON & PronType=Int]"
# --- Truncated word part ---
- "[TRUNC] <> [X & Hyph=Yes]"
# --- VA* tags -> AUX ---
- "[VAFIN] <> [AUX & Mood=Ind & VerbForm=Fin]"
- "[VAIMP] <> [AUX & Mood=Imp & VerbForm=Fin]"
- "[VAINF] <> [AUX & VerbForm=Inf]"
- "[VAPP] <> [AUX & Aspect=Perf & VerbForm=Part]"
# --- VM* tags -> VERB with VerbType=Mod ---
- "[VMFIN] <> [VERB & Mood=Ind & VerbForm=Fin & VerbType=Mod]"
- "[VMINF] <> [VERB & VerbForm=Inf & VerbType=Mod]"
- "[VMPP] <> [VERB & Aspect=Perf & VerbForm=Part & VerbType=Mod]"
# --- VV* tags -> VERB ---
- "[VVFIN] <> [VERB & Mood=Ind & VerbForm=Fin]"
- "[VVIMP] <> [VERB & Mood=Imp & VerbForm=Fin]"
# VVINF and VVIZU share the same right-hand pattern, so they cannot be told
# apart on the UPoS side.
- "[VVINF] <> [VERB & VerbForm=Inf]"
- "[VVIZU] <> [VERB & VerbForm=Inf]"
- "[VVPP] <> [VERB & Aspect=Perf & VerbForm=Part]"
# --- Remaining tag ---
- "[XY] <> [X]"
# Fallback rules for bare UPoS tags (less specific, selected only when no
# more-specific rule matches).
# Each rule pairs a UPoS tag that carries no features with the "|"-joined set
# of all STTS tags whose specific rule targets that UPoS tag. Every UPoS tag
# that only occurs with features in the specific rules needs an entry here;
# otherwise a bare occurrence of that tag has no rule at all.
- "[ADJA | ADJD] <> [ADJ]"
- "[ART | PDAT | PIAT | PIDAT | PPOSAT | PRELAT | PWAT] <> [DET]"
- "[KOUI | KOUS] <> [SCONJ]"
- "[VVFIN | VVIMP | VVINF | VVIZU | VVPP | VMFIN | VMINF | VMPP] <> [VERB]"
- "[VAFIN | VAIMP | VAINF | VAPP] <> [AUX]"
- "[APPO | APPR | APPRART | APZR | PTKVZ] <> [ADP]"
- "[PDS | PIS | PPER | PPOSS | PRELS | PRF | PWS] <> [PRON]"
- "[PTKA | PTKANT | PTKNEG | PTKZU] <> [PART]"
- "[FM | TRUNC | XY] <> [X]"
# Same "\\" -> single backslash escaping as in the specific "$(" rule.
- "[$\\( | $, | $.] <> [PUNCT]"
- "[KON | KOKOM] <> [CCONJ]"
- "[ADV | PAV | PWAV] <> [ADV]"
# NOUN and PROPN are deliberately pooled on both sides of this rule.
- "[NN | NE] <> [NOUN | PROPN]"
# CARD is the only STTS tag targeting NUM, and its specific rule requires
# NumType=Card; this entry covers a bare NUM. Appended last so the relative
# order of the pre-existing rules is unchanged.
- "[CARD] <> [NUM]"