mirror of
				https://github.com/explosion/spaCy.git
				synced 2025-10-31 16:07:41 +03:00 
			
		
		
		
	
		
			
				
	
	
		
			40 lines
		
	
	
		
			1.1 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			40 lines
		
	
	
		
			1.1 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| # coding: utf-8
 | |
| from __future__ import unicode_literals
 | |
| 
 | |
| from ...attrs import LEMMA, ORTH, PROB, IS_ALPHA
 | |
| from ...parts_of_speech import NOUN, VERB
 | |
| 
 | |
| import pytest
 | |
| 
 | |
| 
 | |
@pytest.mark.parametrize('text1,text2', [
    ("Hello", "bye"),
    ("Hello", "hello"),
    ("Hello", "Hello,"),
])
def test_vocab_api_neq(en_vocab, text1, text2):
    """Two different strings must not share the same ``orth`` value."""
    first_orth = en_vocab[text1].orth
    second_orth = en_vocab[text2].orth
    assert first_orth != second_orth
 | |
| 
 | |
| 
 | |
# The argvalues must be a list: a bare string is iterated character by
# character, which would run the test on 'H', 'e', 'l', 'l', 'o' instead of
# once on the whole word.
@pytest.mark.parametrize('text', ["Hello"])
def test_vocab_api_eq(en_vocab, text):
    """Looking the same string up twice must give the same ``orth`` value."""
    lex = en_vocab[text]
    assert en_vocab[text].orth == lex.orth
 | |
| 
 | |
| 
 | |
@pytest.mark.parametrize('text', ["example"])
def test_vocab_api_shape_attr(en_vocab, text):
    """The ``orth`` and ``shape`` attributes of a lexeme must differ."""
    lexeme = en_vocab[text]
    orth, shape = lexeme.orth, lexeme.shape
    assert orth != shape
 | |
| 
 | |
| 
 | |
@pytest.mark.parametrize('string,symbol', [
    ('IS_ALPHA', IS_ALPHA),
    ('NOUN', NOUN),
    ('VERB', VERB),
    ('LEMMA', LEMMA),
    ('ORTH', ORTH),
    ('PROB', PROB),
])
def test_vocab_api_symbols(en_vocab, string, symbol):
    """A symbol name looked up in ``en_vocab.strings`` equals its constant."""
    looked_up = en_vocab.strings[string]
    assert looked_up == symbol
 | |
| 
 | |
| 
 | |
# The argvalues must be a list: a bare string is iterated character by
# character, which would run the test on single letters instead of "Hello".
@pytest.mark.parametrize('text', ["Hello"])
def test_vocab_api_contains(en_vocab, text):
    """A string that was looked up is reported as contained in the vocab.

    An arbitrary string that was never looked up must not be contained.
    """
    # Look the string up first; the result itself is not needed.
    _ = en_vocab[text]
    assert text in en_vocab
    assert "LKsdjvlsakdvlaksdvlkasjdvljasdlkfvm" not in en_vocab
 |