mirror of
https://github.com/explosion/spaCy.git
synced 2024-12-25 17:36:30 +03:00
Restore missing normalization from gold align
PR #4526 missed extra lower-casing and spacing normalization.
This commit is contained in:
parent
554850206c
commit
bddfbc7e1b
|
@ -77,6 +77,7 @@ _NORM_MAP = {"``": '"', "''": '"'}
|
|||
|
||||
|
||||
def _normalize(tokens):
    """Return a list of normalized copies of the strings in `tokens`.

    Every token has its space characters stripped out and is lower-cased.
    The resulting string is then swapped for its `_NORM_MAP` entry when the
    map contains one; otherwise it is kept as is.
    """
    normalized = []
    for token in tokens:
        # Remove spaces and case differences before consulting the map.
        squashed = token.replace(" ", "").lower()
        normalized.append(_NORM_MAP.get(squashed, squashed))
    return normalized
|
||||
|
||||
|
||||
|
|
Loading…
Reference in New Issue
Block a user