spaCy/spacy/tests/lang/el/test_exception.py
Eleni170 6042723535 Add support for Greek language (#2535)
* Add contributor agreement

* Support for Greek language

* Fix missing el_tokenizer
2018-07-10 13:48:38 +02:00

18 lines
573 B
Python

# -*- coding: utf-8 -*-
from __future__ import unicode_literals
import pytest
@pytest.mark.parametrize('text', ["αριθ.", "τρισ.", "δισ.", "σελ."])
def test_tokenizer_handles_abbr(el_tokenizer, text):
    """Check that a Greek abbreviation ending in a period is one token.

    Each parametrized ``text`` is a standalone abbreviation; the trailing
    period must stay attached instead of being split off as punctuation.
    """
    tokens = el_tokenizer(text)
    assert len(tokens) == 1
    # Mirror the in-sentence test: the single token must carry the whole
    # abbreviation, period included.
    assert tokens[0].text == text
def test_tokenizer_handles_exc_in_text(el_tokenizer):
    """Check that an abbreviation stays intact inside a full sentence.

    The sentence contains the abbreviation "τρισ." mid-text and ends with
    a sentence-final period, so both period roles are exercised at once.
    """
    text = "Στα 14 τρισ. δολάρια το κόστος από την άνοδο της στάθμης της θάλασσας."
    tokens = el_tokenizer(text)
    # 13 words/numbers plus the final period as its own token.
    assert len(tokens) == 14
    # The abbreviation keeps its period rather than being split in two.
    assert tokens[2].text == "τρισ."