# coding: utf-8
from __future__ import unicode_literals

import pytest


# NOTE: "\u0020" is U+0020 SPACE, so both parametrized literals evaluate to
# the same string; they differ only in how the trailing space is spelled in
# the source.
@pytest.mark.xfail
@pytest.mark.parametrize('text', ["This is a string ", "This is a string\u0020"])
def test_issue792(en_tokenizer, text):
    """Regression test for Issue #792: trailing whitespace is removed.

    Tokenizes ``text`` (which ends in a single space) and checks that the
    resulting doc's ``text_with_ws`` is equal to the original input, i.e.
    that the trailing whitespace survives the round trip.

    Marked ``xfail`` because the test is expected to fail for now.

    en_tokenizer: Tokenizer fixture, called directly on the input text.
    text: Input string supplied by the ``parametrize`` decorator.
    """
    doc = en_tokenizer(text)
    assert doc.text_with_ws == text