mirror of
https://github.com/explosion/spaCy.git
synced 2025-01-13 18:56:36 +03:00
Restore missing normalization from gold align
PR #4526 missed extra lower-casing and spacing normalization.
This commit is contained in:
parent
554850206c
commit
bddfbc7e1b
|
@@ -77,6 +77,7 @@ _NORM_MAP = {"``": '"', "''": '"'}
|
||||||
|
|
||||||
|
|
||||||
def _normalize(tokens):
|
def _normalize(tokens):
|
||||||
|
tokens = [w.replace(" ", "").lower() for w in tokens]
|
||||||
return [_NORM_MAP.get(word, word) for word in tokens]
|
return [_NORM_MAP.get(word, word) for word in tokens]
|
||||||
|
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue
Block a user