Map NR to PROPN (#5512)

This commit is contained in:
adrianeboyd 2020-05-26 22:30:53 +02:00 committed by GitHub
parent f00488ab30
commit aad0610a85
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

View File

@@ -2,7 +2,7 @@
 from __future__ import unicode_literals
 from ...symbols import POS, PUNCT, ADJ, SCONJ, CCONJ, NUM, DET, ADV, ADP, X
-from ...symbols import NOUN, PART, INTJ, PRON, VERB, SPACE
+from ...symbols import NOUN, PART, INTJ, PRON, VERB, SPACE, PROPN
 # The Chinese part-of-speech tagger uses the OntoNotes 5 version of the Penn
 # Treebank tag set. We also map the tags to the simpler Universal Dependencies
@@ -28,7 +28,7 @@ TAG_MAP = {
 "URL": {POS: X},
 "INF": {POS: X},
 "NN": {POS: NOUN},
-"NR": {POS: NOUN},
+"NR": {POS: PROPN},
 "NT": {POS: NOUN},
 "VA": {POS: VERB},
 "VC": {POS: VERB},