mirror of
https://github.com/explosion/spaCy.git
synced 2024-11-13 05:07:03 +03:00
Fix tag map for German
This commit is contained in:
parent
28326649f3
commit
0fc4e45cb3
|
@ -9,63 +9,63 @@ from ..language_data import TOKENIZER_INFIXES
|
||||||
|
|
||||||
|
|
||||||
TAG_MAP = {
|
TAG_MAP = {
|
||||||
"$(": {TAG: PUNCT, "PunctType": "brck"},
|
"$(": {POS: PUNCT, "PunctType": "brck"},
|
||||||
"$,": {TAG: PUNCT, "PunctType": "comm"},
|
"$,": {POS: PUNCT, "PunctType": "comm"},
|
||||||
"$.": {TAG: PUNCT, "PunctType": "peri"},
|
"$.": {POS: PUNCT, "PunctType": "peri"},
|
||||||
"ADJA": {TAG: ADJ},
|
"ADJA": {POS: ADJ},
|
||||||
"ADJD": {TAG: ADJ, "Variant": "short"},
|
"ADJD": {POS: ADJ, "Variant": "short"},
|
||||||
"ADV": {TAG: ADV},
|
"ADV": {POS: ADV},
|
||||||
"APPO": {TAG: ADP, "AdpType": "post"},
|
"APPO": {POS: ADP, "AdpType": "post"},
|
||||||
"APPR": {TAG: ADP, "AdpType": "prep"},
|
"APPR": {POS: ADP, "AdpType": "prep"},
|
||||||
"APPRART": {TAG: ADP, "AdpType": "prep", "PronType": "art"},
|
"APPRART": {POS: ADP, "AdpType": "prep", "PronType": "art"},
|
||||||
"APZR": {TAG: ADP, "AdpType": "circ"},
|
"APZR": {POS: ADP, "AdpType": "circ"},
|
||||||
"ART": {TAG: DET, "PronType": "art"},
|
"ART": {POS: DET, "PronType": "art"},
|
||||||
"CARD": {TAG: NUM, "NumType": "card"},
|
"CARD": {POS: NUM, "NumType": "card"},
|
||||||
"FM": {TAG: X, "Foreign": "yes"},
|
"FM": {POS: X, "Foreign": "yes"},
|
||||||
"ITJ": {TAG: INTJ},
|
"ITJ": {POS: INTJ},
|
||||||
"KOKOM": {TAG: CONJ, "ConjType": "comp"},
|
"KOKOM": {POS: CONJ, "ConjType": "comp"},
|
||||||
"KON": {TAG: CONJ},
|
"KON": {POS: CONJ},
|
||||||
"KOUI": {TAG: SCONJ},
|
"KOUI": {POS: SCONJ},
|
||||||
"KOUS": {TAG: SCONJ},
|
"KOUS": {POS: SCONJ},
|
||||||
"NE": {TAG: PROPN},
|
"NE": {POS: PROPN},
|
||||||
"NNE": {TAG: PROPN},
|
"NNE": {POS: PROPN},
|
||||||
"NN": {TAG: NOUN},
|
"NN": {POS: NOUN},
|
||||||
"PAV": {TAG: ADV, "PronType": "dem"},
|
"PAV": {POS: ADV, "PronType": "dem"},
|
||||||
"PROAV": {TAG: ADV, "PronType": "dem"},
|
"PROAV": {POS: ADV, "PronType": "dem"},
|
||||||
"PDAT": {TAG: DET, "PronType": "dem"},
|
"PDAT": {POS: DET, "PronType": "dem"},
|
||||||
"PDS": {TAG: PRON, "PronType": "dem"},
|
"PDS": {POS: PRON, "PronType": "dem"},
|
||||||
"PIAT": {TAG: DET, "PronType": "ind|neg|tot"},
|
"PIAT": {POS: DET, "PronType": "ind|neg|tot"},
|
||||||
"PIDAT": {TAG: DET, "AdjType": "pdt", "PronType": "ind|neg|tot"},
|
"PIDAT": {POS: DET, "AdjType": "pdt", "PronType": "ind|neg|tot"},
|
||||||
"PIS": {TAG: PRON, "PronType": "ind|neg|tot"},
|
"PIS": {POS: PRON, "PronType": "ind|neg|tot"},
|
||||||
"PPER": {TAG: PRON, "PronType": "prs"},
|
"PPER": {POS: PRON, "PronType": "prs"},
|
||||||
"PPOSAT": {TAG: DET, "Poss": "yes", "PronType": "prs"},
|
"PPOSAT": {POS: DET, "Poss": "yes", "PronType": "prs"},
|
||||||
"PPOSS": {TAG: PRON, "Poss": "yes", "PronType": "prs"},
|
"PPOSS": {POS: PRON, "Poss": "yes", "PronType": "prs"},
|
||||||
"PRELAT": {TAG: DET, "PronType": "rel"},
|
"PRELAT": {POS: DET, "PronType": "rel"},
|
||||||
"PRELS": {TAG: PRON, "PronType": "rel"},
|
"PRELS": {POS: PRON, "PronType": "rel"},
|
||||||
"PRF": {TAG: PRON, "PronType": "prs", "Reflex": "yes"},
|
"PRF": {POS: PRON, "PronType": "prs", "Reflex": "yes"},
|
||||||
"PTKA": {TAG: PART},
|
"PTKA": {POS: PART},
|
||||||
"PTKANT": {TAG: PART, "PartType": "res"},
|
"PTKANT": {POS: PART, "PartType": "res"},
|
||||||
"PTKNEG": {TAG: PART, "Negative": "yes"},
|
"PTKNEG": {POS: PART, "Negative": "yes"},
|
||||||
"PTKVZ": {TAG: PART, "PartType": "vbp"},
|
"PTKVZ": {POS: PART, "PartType": "vbp"},
|
||||||
"PTKZU": {TAG: PART, "PartType": "inf"},
|
"PTKZU": {POS: PART, "PartType": "inf"},
|
||||||
"PWAT": {TAG: DET, "PronType": "int"},
|
"PWAT": {POS: DET, "PronType": "int"},
|
||||||
"PWAV": {TAG: ADV, "PronType": "int"},
|
"PWAV": {POS: ADV, "PronType": "int"},
|
||||||
"PWS": {TAG: PRON, "PronType": "int"},
|
"PWS": {POS: PRON, "PronType": "int"},
|
||||||
"TRUNC": {TAG: X, "Hyph": "yes"},
|
"TRUNC": {POS: X, "Hyph": "yes"},
|
||||||
"VAFIN": {TAG: AUX, "Mood": "ind", "VerbForm": "fin"},
|
"VAFIN": {POS: AUX, "Mood": "ind", "VerbForm": "fin"},
|
||||||
"VAIMP": {TAG: AUX, "Mood": "imp", "VerbForm": "fin"},
|
"VAIMP": {POS: AUX, "Mood": "imp", "VerbForm": "fin"},
|
||||||
"VAINF": {TAG: AUX, "VerbForm": "inf"},
|
"VAINF": {POS: AUX, "VerbForm": "inf"},
|
||||||
"VAPP": {TAG: AUX, "Aspect": "perf", "VerbForm": "part"},
|
"VAPP": {POS: AUX, "Aspect": "perf", "VerbForm": "part"},
|
||||||
"VMFIN": {TAG: VERB, "Mood": "ind", "VerbForm": "fin", "VerbType": "mod"},
|
"VMFIN": {POS: VERB, "Mood": "ind", "VerbForm": "fin", "VerbType": "mod"},
|
||||||
"VMINF": {TAG: VERB, "VerbForm": "inf", "VerbType": "mod"},
|
"VMINF": {POS: VERB, "VerbForm": "inf", "VerbType": "mod"},
|
||||||
"VMPP": {TAG: VERB, "Aspect": "perf", "VerbForm": "part", "VerbType": "mod"},
|
"VMPP": {POS: VERB, "Aspect": "perf", "VerbForm": "part", "VerbType": "mod"},
|
||||||
"VVFIN": {TAG: VERB, "Mood": "ind", "VerbForm": "fin"},
|
"VVFIN": {POS: VERB, "Mood": "ind", "VerbForm": "fin"},
|
||||||
"VVIMP": {TAG: VERB, "Mood": "imp", "VerbForm": "fin"},
|
"VVIMP": {POS: VERB, "Mood": "imp", "VerbForm": "fin"},
|
||||||
"VVINF": {TAG: VERB, "VerbForm": "inf"},
|
"VVINF": {POS: VERB, "VerbForm": "inf"},
|
||||||
"VVIZU": {TAG: VERB, "VerbForm": "inf"},
|
"VVIZU": {POS: VERB, "VerbForm": "inf"},
|
||||||
"VVPP": {TAG: VERB, "Aspect": "perf", "VerbForm": "part"},
|
"VVPP": {POS: VERB, "Aspect": "perf", "VerbForm": "part"},
|
||||||
"XY": {TAG: X},
|
"XY": {POS: X},
|
||||||
"SP": {TAG: SPACE}
|
"SP": {POS: SPACE}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue
Block a user