mirror of
				https://github.com/explosion/spaCy.git
				synced 2025-11-04 01:48:04 +03:00 
			
		
		
		
	Switch default train corpus max_length to 0 in quickstart (#8142)
The behavior of `spacy.Corpus.v1` is unexpected enough for `max_length != 0` that `0` is a better default for users creating a new config with the quickstart. With a nonzero `max_length`, documents are skipped, sometimes the entire corpus is skipped, and sometimes documents are (quite unexpectedly for your average user) split into sentences.
This commit is contained in:
		
							parent
							
								
									4e69fcaa50
								
							
						
					
					
						commit
						cd6bd91c3a
					
				| 
						 | 
					@ -372,7 +372,7 @@ factory = "{{ pipe }}"
 | 
				
			||||||
[corpora.train]
 | 
					[corpora.train]
 | 
				
			||||||
@readers = "spacy.Corpus.v1"
 | 
					@readers = "spacy.Corpus.v1"
 | 
				
			||||||
path = ${paths.train}
 | 
					path = ${paths.train}
 | 
				
			||||||
max_length = {{ 500 if hardware == "gpu" else 2000 }}
 | 
					max_length = 0
 | 
				
			||||||
 | 
					
 | 
				
			||||||
[corpora.dev]
 | 
					[corpora.dev]
 | 
				
			||||||
@readers = "spacy.Corpus.v1"
 | 
					@readers = "spacy.Corpus.v1"
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
		Loading…
	
		Reference in New Issue
	
	Block a user