From 713d7c0aa0cc4524f29361a03d6edb26b9936d07 Mon Sep 17 00:00:00 2001 From: Jim Geovedi Date: Sun, 20 Aug 2017 12:17:14 +0700 Subject: [PATCH] added indonesian lang test --- spacy/tests/conftest.py | 7 +++++-- 1 file changed, 5 insertions(+), 2 deletions(-) diff --git a/spacy/tests/conftest.py b/spacy/tests/conftest.py index 200f9ff4f..e0e999f4c 100644 --- a/spacy/tests/conftest.py +++ b/spacy/tests/conftest.py @@ -11,8 +11,8 @@ from ..strings import StringStore from .. import util -_languages = ['bn', 'da', 'de', 'en', 'es', 'fi', 'fr', 'he', 'hu', 'it', 'nb', - 'nl', 'pl', 'pt', 'sv', 'xx'] +_languages = ['bn', 'da', 'de', 'en', 'es', 'fi', 'fr', 'he', 'hu', 'id', + 'it', 'nb', 'nl', 'pl', 'pt', 'sv', 'xx'] _models = {'en': ['en_depent_web_sm', 'en_core_web_md'], 'de': ['de_core_news_md'], 'fr': ['fr_depvec_web_lg'], @@ -86,6 +86,9 @@ def hu_tokenizer(): def fi_tokenizer(): return util.get_lang_class('fi').Defaults.create_tokenizer() +@pytest.fixture +def id_tokenizer(): + return util.get_lang_class('id').Defaults.create_tokenizer() @pytest.fixture def sv_tokenizer():