mirror of
https://github.com/explosion/spaCy.git
synced 2024-12-26 18:06:29 +03:00
Fix Korean
This commit is contained in:
parent
159b72ed4c
commit
75514b5970
|
@@ -46,7 +46,7 @@ class KoreanTokenizer(DummyTokenizer):
|
||||||
|
|
||||||
def __call__(self, text):
|
def __call__(self, text):
|
||||||
dtokens = list(self.detailed_tokens(text))
|
dtokens = list(self.detailed_tokens(text))
|
||||||
surfaces = [dt.surface for dt in dtokens]
|
surfaces = [dt["surface"] for dt in dtokens]
|
||||||
doc = Doc(self.vocab, words=surfaces, spaces=list(check_spaces(text, surfaces)))
|
doc = Doc(self.vocab, words=surfaces, spaces=list(check_spaces(text, surfaces)))
|
||||||
for token, dtoken in zip(doc, dtokens):
|
for token, dtoken in zip(doc, dtokens):
|
||||||
first_tag, sep, eomi_tags = dtoken["tag"].partition("+")
|
first_tag, sep, eomi_tags = dtoken["tag"].partition("+")
|
||||||
|
|
Loading…
Reference in New Issue
Block a user