mirror of
				https://github.com/explosion/spaCy.git
				synced 2025-10-31 16:07:41 +03:00 
			
		
		
		
	
		
			
				
	
	
		
			29 lines
		
	
	
		
			822 B
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			29 lines
		
	
	
		
			822 B
		
	
	
	
		
			Python
		
	
	
	
	
	
| from spacy.util import filter_spans
 | |
| from pydantic import ValidationError
 | |
| from spacy.schemas import TokenPattern, TokenPatternSchema
 | |
| import pytest
 | |
| 
 | |
| 
 | |
def test_issue6207(en_tokenizer):
    """Regression test for issue 6207: filtering a chain of overlapping spans.

    Three spans are built so that the middle one overlaps both neighbours
    while the outer two do not overlap each other. After filtering, the
    outer two must survive and the middle one must be dropped.
    """
    doc = en_tokenizer("zero one two three four five six")

    # Build the chain of spans over the seven-token doc.
    leading = doc[:4]
    middle = doc[3:6]  # shares token 3 with `leading`
    trailing = doc[5:7]  # shares token 5 with `middle`, none with `leading`

    kept = filter_spans((leading, middle, trailing))

    assert leading in kept
    assert middle not in kept
    assert trailing in kept
 | |
| 
 | |
| 
 | |
def test_issue6258():
    """Regression test for issue 6258: the pattern field must be non-empty."""
    # A pattern list holding a single token pattern is valid and must
    # construct without raising.
    single_token_pattern = [TokenPattern()]
    TokenPatternSchema(pattern=single_token_pattern)

    # An empty pattern list violates the schema's constraint, so
    # validation is expected to fail.
    with pytest.raises(ValidationError):
        TokenPatternSchema(pattern=[])
 |