mirror of
				https://github.com/explosion/spaCy.git
				synced 2025-10-26 13:41:21 +03:00 
			
		
		
		
	Use unicode string literals (u"...") for Python 2.7 compatibility
This commit is contained in:
		
							parent
							
								
									eca9cc5417
								
							
						
					
					
						commit
						673c81bbb4
					
				|  | @ -70,6 +70,6 @@ yet you your yours yourself yourselves | ||||||
| ) | ) | ||||||
| 
 | 
 | ||||||
| for hyphen in ["'", "`", "‘", "´", "’"]: | for hyphen in ["'", "`", "‘", "´", "’"]: | ||||||
|     for stopword in "n't 'd 'll 'm 're 's 've".split(): |     for stopword in u"n't 'd 'll 'm 're 's 've".split(): | ||||||
|         STOP_WORDS.add(stopword.replace("'", hyphen)) |         STOP_WORDS.add(stopword.replace("'", hyphen)) | ||||||
| 
 | 
 | ||||||
|  |  | ||||||
|  | @ -4,10 +4,10 @@ import pytest | ||||||
| @pytest.mark.parametrize( | @pytest.mark.parametrize( | ||||||
|     "word", |     "word", | ||||||
|     [ |     [ | ||||||
|         "don't", |         u"don't", | ||||||
|         "don’t", |         u"don’t", | ||||||
|         "I'd", |         u"I'd", | ||||||
|         "I’d", |         u"I’d", | ||||||
|     ], |     ], | ||||||
| ) | ) | ||||||
| def test_issue3521(en_tokenizer, word): | def test_issue3521(en_tokenizer, word): | ||||||
|  |  | ||||||
		Loading…
	
		Reference in New Issue
	
	Block a user