Move language-specific tests to tests/lang

2025-11-22 18:55:43 +03:00 · 2017-05-09 00:02:37 +02:00 · 2017-05-09 00:02:37 +02:00 · c714841cc8
commit c714841cc8
parent bd57b611cc
25 changed files with 4 additions and 9 deletions
--- a/spacy/tests/bn/__init__.py
+++ b/spacy/tests/bn/__init__.py
@@ -1 +0,0 @@
-# coding: utf-8
--- a/spacy/tests/fr/__init__.py
+++ b/spacy/tests/fr/__init__.py
@@ -1 +0,0 @@
-# coding: utf-8
--- a/spacy/tests/lang/bn/test_tokenizer.py
+++ b/spacy/tests/lang/bn/test_tokenizer.py
--- a/spacy/tests/lang/de/test_exceptions.py
+++ b/spacy/tests/lang/de/test_exceptions.py
--- a/spacy/tests/lang/de/test_prefix_suffix_infix.py
+++ b/spacy/tests/lang/de/test_prefix_suffix_infix.py
--- a/spacy/tests/lang/de/test_text.py
+++ b/spacy/tests/lang/de/test_text.py
--- a/spacy/tests/lang/en/test_contractions.py
+++ b/spacy/tests/lang/en/test_contractions.py
--- a/spacy/tests/lang/en/test_exceptions.py
+++ b/spacy/tests/lang/en/test_exceptions.py
--- a/spacy/tests/lang/en/test_indices.py
+++ b/spacy/tests/lang/en/test_indices.py
--- a/spacy/tests/lang/en/test_prefix_suffix_infix.py
+++ b/spacy/tests/lang/en/test_prefix_suffix_infix.py
--- a/spacy/tests/lang/en/test_punct.py
+++ b/spacy/tests/lang/en/test_punct.py
@@ -6,8 +6,8 @@ from __future__ import unicode_literals

 import pytest

-from ...util import compile_prefix_regex
-from ...language_data import TOKENIZER_PREFIXES
+from ....util import compile_prefix_regex
+from ....lang.punctuation import TOKENIZER_PREFIXES


 PUNCT_OPEN = ['(', '[', '{', '*']
--- a/spacy/tests/lang/en/test_text.py
+++ b/spacy/tests/lang/en/test_text.py
--- a/spacy/tests/lang/es/test_exception.py
+++ b/spacy/tests/lang/es/test_exception.py
--- a/spacy/tests/lang/es/test_text.py
+++ b/spacy/tests/lang/es/test_text.py
--- a/spacy/tests/lang/fi/test_tokenizer.py
+++ b/spacy/tests/lang/fi/test_tokenizer.py
@@ -3,15 +3,14 @@ from __future__ import unicode_literals

 import pytest

+
 ABBREVIATION_TESTS = [
    ('Hyvää uutta vuotta t. siht. Niemelä!', ['Hyvää', 'uutta', 'vuotta', 't.', 'siht.', 'Niemelä', '!']),
    ('Paino on n. 2.2 kg', ['Paino', 'on', 'n.', '2.2', 'kg'])
 ]

-TESTCASES = ABBREVIATION_TESTS

-
-@pytest.mark.parametrize('text,expected_tokens', TESTCASES)
+@pytest.mark.parametrize('text,expected_tokens', ABBREVIATION_TESTS)
 def test_tokenizer_handles_testcases(fi_tokenizer, text, expected_tokens):
    tokens = fi_tokenizer(text)
    token_list = [token.text for token in tokens if not token.is_space]
--- a/spacy/tests/lang/fr/test_exceptions.py
+++ b/spacy/tests/lang/fr/test_exceptions.py
--- a/spacy/tests/lang/fr/test_lemmatization.py
+++ b/spacy/tests/lang/fr/test_lemmatization.py
--- a/spacy/tests/lang/fr/test_text.py
+++ b/spacy/tests/lang/fr/test_text.py
@@ -1,6 +1,4 @@
 # coding: utf8
-
-
 from __future__ import unicode_literals


--- a/spacy/tests/lang/he/test_tokenizer.py
+++ b/spacy/tests/lang/he/test_tokenizer.py
--- a/spacy/tests/lang/hu/__init__.py
+++ b/spacy/tests/lang/hu/__init__.py
--- a/spacy/tests/lang/hu/test_tokenizer.py
+++ b/spacy/tests/lang/hu/test_tokenizer.py
--- a/spacy/tests/lang/nb/__init__.py
+++ b/spacy/tests/lang/nb/__init__.py
--- a/spacy/tests/lang/nb/test_tokenizer.py
+++ b/spacy/tests/lang/nb/test_tokenizer.py
--- a/spacy/tests/lang/sv/__init__.py
+++ b/spacy/tests/lang/sv/__init__.py
--- a/spacy/tests/lang/sv/test_tokenizer.py
+++ b/spacy/tests/lang/sv/test_tokenizer.py