Update English tag_map

Update English tag_map based on this conversion table:
https://universaldependencies.org/tagset-conversion/en-penn-uposf.html
This commit is contained in:
Adriane Boyd 2019-10-22 09:36:37 +02:00
parent 7772d5d3c5
commit a68d2203e0

View File

@@ -28,8 +28,8 @@ TAG_MAP = {
"JJR": {POS: ADJ, "Degree": "comp"}, "JJR": {POS: ADJ, "Degree": "comp"},
"JJS": {POS: ADJ, "Degree": "sup"}, "JJS": {POS: ADJ, "Degree": "sup"},
"LS": {POS: X, "NumType": "ord"}, "LS": {POS: X, "NumType": "ord"},
"MD": {POS: AUX, "VerbType": "mod"}, "MD": {POS: VERB, "VerbType": "mod"},
"NIL": {POS: ""}, "NIL": {POS: X},
"NN": {POS: NOUN, "Number": "sing"}, "NN": {POS: NOUN, "Number": "sing"},
"NNP": {POS: PROPN, "NounType": "prop", "Number": "sing"}, "NNP": {POS: PROPN, "NounType": "prop", "Number": "sing"},
"NNPS": {POS: PROPN, "NounType": "prop", "Number": "plur"}, "NNPS": {POS: PROPN, "NounType": "prop", "Number": "plur"},
@@ -37,7 +37,7 @@ TAG_MAP = {
"PDT": {POS: DET}, "PDT": {POS: DET},
"POS": {POS: PART, "Poss": "yes"}, "POS": {POS: PART, "Poss": "yes"},
"PRP": {POS: PRON, "PronType": "prs"}, "PRP": {POS: PRON, "PronType": "prs"},
"PRP$": {POS: PRON, "PronType": "prs", "Poss": "yes"}, "PRP$": {POS: DET, "PronType": "prs", "Poss": "yes"},
"RB": {POS: ADV, "Degree": "pos"}, "RB": {POS: ADV, "Degree": "pos"},
"RBR": {POS: ADV, "Degree": "comp"}, "RBR": {POS: ADV, "Degree": "comp"},
"RBS": {POS: ADV, "Degree": "sup"}, "RBS": {POS: ADV, "Degree": "sup"},
@@ -58,9 +58,9 @@ TAG_MAP = {
"Number": "sing", "Number": "sing",
"Person": "three", "Person": "three",
}, },
"WDT": {POS: PRON}, "WDT": {POS: DET},
"WP": {POS: PRON}, "WP": {POS: PRON},
"WP$": {POS: PRON, "Poss": "yes"}, "WP$": {POS: DET, "Poss": "yes"},
"WRB": {POS: ADV}, "WRB": {POS: ADV},
"ADD": {POS: X}, "ADD": {POS: X},
"NFP": {POS: PUNCT}, "NFP": {POS: PUNCT},