mirror of
https://github.com/explosion/spaCy.git
synced 2024-12-25 01:16:28 +03:00
Fix Korean
This commit is contained in:
parent
159b72ed4c
commit
75514b5970
|
@@ -46,7 +46,7 @@ class KoreanTokenizer(DummyTokenizer):
|
|||
|
||||
def __call__(self, text):
|
||||
dtokens = list(self.detailed_tokens(text))
|
||||
-surfaces = [dt.surface for dt in dtokens]
|
||||
+surfaces = [dt["surface"] for dt in dtokens]
|
||||
doc = Doc(self.vocab, words=surfaces, spaces=list(check_spaces(text, surfaces)))
|
||||
for token, dtoken in zip(doc, dtokens):
|
||||
first_tag, sep, eomi_tags = dtoken["tag"].partition("+")
|
||||
|
|
Loading…
Reference in New Issue
Block a user