..  
		
		
			
			
			
			
				
					
						
							
								
								
									
									
									
										bn
									
								 
							
						
					 
				 
				
					
						
							
							Merge pull request  #885  from PySUST/master 
						
					 
				 
				2017-03-12 13:20:59 +01:00  
		
			
			
			
			
				
					
						
							
								
								
									
									
									
										cli
									
								 
							
						
					 
				 
				
					
						
							
							Fix whitespace 
						
					 
				 
				2017-04-07 13:28:48 +02:00  
		
			
			
			
			
				
					
						
							
								
								
									
									
									
										data
									
								 
							
						
					 
				 
				
					
						
							
							Make spacy/data a package 
						
					 
				 
				2017-03-18 20:04:22 +01:00  
		
			
			
			
			
				
					
						
							
								
								
									
									
									
										de
									
								 
							
						
					 
				 
				
					
						
							
							Handle deprecated language-specific model downloading 
						
					 
				 
				2017-03-15 17:37:55 +01:00  
		
			
			
			
			
				
					
						
							
								
								
									
									
									
										en
									
								 
							
						
					 
				 
				
					
						
							
							Add missing tags to verbs ( resolves   #948 ) 
						
					 
				 
				2017-04-03 18:12:52 +02:00  
		
			
			
			
			
				
					
						
							
								
								
									
									
									
										es
									
								 
							
						
					 
				 
				
					
						
							
							feature(model): Add support for creating the Spanish model, including rich tagset, configuration, and basich tests 
						
					 
				 
				2017-04-06 18:48:45 +02:00  
		
			
			
			
			
				
					
						
							
								
								
									
									
									
										fi
									
								 
							
						
					 
				 
				
					
						
							
							Remove duplicate keys in [en|fi] data dicts 
						
					 
				 
				2017-03-19 11:40:29 +01:00  
		
			
			
			
			
				
					
						
							
								
								
									
									
									
										fr
									
								 
							
						
					 
				 
				
					
						
							
							Use consistent unicode declarations 
						
					 
				 
				2017-03-12 13:07:28 +01:00  
		
			
			
			
			
				
					
						
							
								
								
									
									
									
										he
									
								 
							
						
					 
				 
				
					
						
							
							add hebrew tokenizer 
						
					 
				 
				2017-03-24 18:27:44 +03:00  
		
			
			
			
			
				
					
						
							
								
								
									
									
									
										hu
									
								 
							
						
					 
				 
				
					
						
							
							Use consistent unicode declarations 
						
					 
				 
				2017-03-12 13:07:28 +01:00  
		
			
			
			
			
				
					
						
							
								
								
									
									
									
										it
									
								 
							
						
					 
				 
				
					
						
							
							Use consistent unicode declarations 
						
					 
				 
				2017-03-12 13:07:28 +01:00  
		
			
			
			
			
				
					
						
							
								
								
									
									
									
										language_data
									
								 
							
						
					 
				 
				
					
						
							
							Add / to tokenizer infixes ( resolves   #891 ) 
						
					 
				 
				2017-04-07 17:30:44 +02:00  
		
			
			
			
			
				
					
						
							
								
								
									
									
									
										munge
									
								 
							
						
					 
				 
				
					
						
							
							* Fix Python3 problem in align_raw 
						
					 
				 
				2015-07-28 16:06:53 +02:00  
		
			
			
			
			
				
					
						
							
								
								
									
									
									
										nl
									
								 
							
						
					 
				 
				
					
						
							
							Use consistent unicode declarations 
						
					 
				 
				2017-03-12 13:07:28 +01:00  
		
			
			
			
			
				
					
						
							
								
								
									
									
									
										pt
									
								 
							
						
					 
				 
				
					
						
							
							Import and combine Portuguese tokenizer exceptions (see  #943 ) 
						
					 
				 
				2017-04-01 10:37:42 +02:00  
		
			
			
			
			
				
					
						
							
								
								
									
									
									
										serialize
									
								 
							
						
					 
				 
				
					
						
							
							Fix Issue  #459  -- failed to deserialize empty doc. 
						
					 
				 
				2016-10-23 16:31:05 +02:00  
		
			
			
			
			
				
					
						
							
								
								
									
									
									
										sv
									
								 
							
						
					 
				 
				
					
						
							
							Use consistent unicode declarations 
						
					 
				 
				2017-03-12 13:07:28 +01:00  
		
			
			
			
			
				
					
						
							
								
								
									
									
									
										syntax
									
								 
							
						
					 
				 
				
					
						
							
							WIP on add_label bug during NER training 
						
					 
				 
				2017-04-14 23:52:17 +02:00  
		
			
			
			
			
				
					
						
							
								
								
									
									
									
										tests
									
								 
							
						
					 
				 
				
					
						
							
							Add unicode declaration on new regression test 
						
					 
				 
				2017-04-07 18:09:23 +02:00  
		
			
			
			
			
				
					
						
							
								
								
									
									
									
										tokens
									
								 
							
						
					 
				 
				
					
						
							
							Remove whitespace 
						
					 
				 
				2017-04-01 10:21:08 +02:00  
		
			
			
			
			
				
					
						
							
								
								
									
									
									
										zh
									
								 
							
						
					 
				 
				
					
						
							
							Import Jieba inside zh.make_doc 
						
					 
				 
				2016-11-02 23:49:19 +01:00  
		
			
			
			
			
				
					
						
							
								__init__.pxd 
							
						
					 
				 
				
					
						
							
							* Seems to be working after refactor. Need to wire up more POS tag features, and wire up save/load of POS tags. 
						
					 
				 
				2014-10-24 02:23:42 +11:00  
		
			
			
			
			
				
					
						
							
								__init__.py 
							
						
					 
				 
				
					
						
							
							Add Hebrew to init and setup.py 
						
					 
				 
				2017-03-29 10:34:57 +02:00  
		
			
			
			
			
				
					
						
							
								__main__.py 
							
						
					 
				 
				
					
						
							
							Add convert command 
						
					 
				 
				2017-04-07 13:04:17 +02:00  
		
			
			
			
			
				
					
						
							
								about.py 
							
						
					 
				 
				
					
						
							
							Increment version 
						
					 
				 
				2017-04-07 18:45:06 +02:00  
		
			
			
			
			
				
					
						
							
								attrs.pxd 
							
						
					 
				 
				
					
						
							
							Whitespace 
						
					 
				 
				2016-12-18 16:51:40 +01:00  
		
			
			
			
			
				
					
						
							
								attrs.pyx 
							
						
					 
				 
				
					
						
							
							Add more morphology names in attrs.pyx 
						
					 
				 
				2017-03-15 09:26:16 -05:00  
		
			
			
			
			
				
					
						
							
								cfile.pxd 
							
						
					 
				 
				
					
						
							
							Add hacky support for StringCFile, to make pickling easier. 
						
					 
				 
				2017-03-07 20:24:37 +01:00  
		
			
			
			
			
				
					
						
							
								cfile.pyx 
							
						
					 
				 
				
					
						
							
							Remove unused import statements 
						
					 
				 
				2017-03-21 21:08:54 +01:00  
		
			
			
			
			
				
					
						
							
								deprecated.py 
							
						
					 
				 
				
					
						
							
							Use correct command in deprecated download command message 
						
					 
				 
				2017-03-18 17:01:01 +01:00  
		
			
			
			
			
				
					
						
							
								gold.pxd 
							
						
					 
				 
				
					
						
							
							Fix gold.pyx for 1.0 
						
					 
				 
				2016-11-25 08:57:59 -06:00  
		
			
			
			
			
				
					
						
							
								gold.pyx 
							
						
					 
				 
				
					
						
							
							Remove unused import statements 
						
					 
				 
				2017-03-21 21:08:54 +01:00  
		
			
			
			
			
				
					
						
							
								language.py 
							
						
					 
				 
				
					
						
							
							Refactor Language.end_training, making new save_to_directory method 
						
					 
				 
				2017-04-14 23:51:24 +02:00  
		
			
			
			
			
				
					
						
							
								lemmatizer.py 
							
						
					 
				 
				
					
						
							
							Fix circular import in lemmatizer 
						
					 
				 
				2017-03-26 07:17:07 -05:00  
		
			
			
			
			
				
					
						
							
								lexeme.pxd 
							
						
					 
				 
				
					
						
							
							Remove stray .tensor attribute from Lexeme 
						
					 
				 
				2016-10-18 01:16:32 +02:00  
		
			
			
			
			
				
					
						
							
								lexeme.pyx 
							
						
					 
				 
				
					
						
							
							Remove whitespace 
						
					 
				 
				2017-04-01 10:21:08 +02:00  
		
			
			
			
			
				
					
						
							
								matcher.pyx 
							
						
					 
				 
				
					
						
							
							Add merge_phrase callback in matcher.pyx 
						
					 
				 
				2017-03-31 13:58:59 +02:00  
		
			
			
			
			
				
					
						
							
								morphology.pxd 
							
						
					 
				 
				
					
						
							
							Add support for Universal Dependencies v2.0 
						
					 
				 
				2017-03-03 13:17:34 +01:00  
		
			
			
			
			
				
					
						
							
								morphology.pyx 
							
						
					 
				 
				
					
						
							
							Fix errors in previous commit 
						
					 
				 
				2017-03-25 22:25:01 +01:00  
		
			
			
			
			
				
					
						
							
								multi_words.py 
							
						
					 
				 
				
					
						
							
							* Fix Issue  #50 : Python 3 compatibility of v0.80 
						
					 
				 
				2015-04-13 05:59:43 +02:00  
		
			
			
			
			
				
					
						
							
								orth.pxd 
							
						
					 
				 
				
					
						
							
							remove text-unidecode dependency 
						
					 
				 
				2016-02-24 08:01:59 +01:00  
		
			
			
			
			
				
					
						
							
								orth.pyx 
							
						
					 
				 
				
					
						
							
							Remove unused code 
						
					 
				 
				2017-03-12 13:58:22 +01:00  
		
			
			
			
			
				
					
						
							
								parts_of_speech.pxd 
							
						
					 
				 
				
					
						
							
							Add support for Universal Dependencies v2.0 
						
					 
				 
				2017-03-03 13:17:34 +01:00  
		
			
			
			
			
				
					
						
							
								parts_of_speech.pyx 
							
						
					 
				 
				
					
						
							
							Add support for Universal Dependencies v2.0 
						
					 
				 
				2017-03-03 13:17:34 +01:00  
		
			
			
			
			
				
					
						
							
								pipeline.pxd 
							
						
					 
				 
				
					
						
							
							Add classes for beam parser and beam NER 
						
					 
				 
				2017-03-11 12:45:37 -06:00  
		
			
			
			
			
				
					
						
							
								pipeline.pyx 
							
						
					 
				 
				
					
						
							
							WIP on add_label bug during NER training 
						
					 
				 
				2017-04-14 23:52:17 +02:00  
		
			
			
			
			
				
					
						
							
								scorer.py 
							
						
					 
				 
				
					
						
							
							Fix scorer bug for NER, related to ambiguity between missing annotations and misaligned tokens 
						
					 
				 
				2017-03-16 09:38:28 -05:00  
		
			
			
			
			
				
					
						
							
								strings.pxd 
							
						
					 
				 
				
					
						
							
							Update strings.pxd 
						
					 
				 
				2016-10-24 14:00:35 +02:00  
		
			
			
			
			
				
					
						
							
								strings.pyx 
							
						
					 
				 
				
					
						
							
							Add support for pickling StringStore. 
						
					 
				 
				2017-03-07 17:15:18 +01:00  
		
			
			
			
			
				
					
						
							
								structs.pxd 
							
						
					 
				 
				
					
						
							
							Initial, limited support for quantified patterns in Matcher, and tracking of ent_id attribute in Token and Span. The quantifiers need a lot more testing, and there are some known problems. The main known problem is that the zero-plus and one-plus quantifiers won't work if a token can match both the quantified pattern expression AND the tail of the match. 
						
					 
				 
				2016-09-21 14:54:55 +02:00  
		
			
			
			
			
				
					
						
							
								symbols.pxd 
							
						
					 
				 
				
					
						
							
							Add support for Universal Dependencies v2.0 
						
					 
				 
				2017-03-03 13:17:34 +01:00  
		
			
			
			
			
				
					
						
							
								symbols.pyx 
							
						
					 
				 
				
					
						
							
							Fix trailing whitespace on morphology features 
						
					 
				 
				2017-03-16 17:07:37 -05:00  
		
			
			
			
			
				
					
						
							
								tagger.pxd 
							
						
					 
				 
				
					
						
							
							Add cfg field to Tagger 
						
					 
				 
				2016-10-17 01:03:41 +02:00  
		
			
			
			
			
				
					
						
							
								tagger.pyx 
							
						
					 
				 
				
					
						
							
							Remove unused import statements 
						
					 
				 
				2017-03-21 21:08:54 +01:00  
		
			
			
			
			
				
					
						
							
								tokenizer.pxd 
							
						
					 
				 
				
					
						
							
							Revert "Revert "Merge remote-tracking branch 'origin/master'"" 
						
					 
				 
				2017-01-09 13:28:13 +01:00  
		
			
			
			
			
				
					
						
							
								tokenizer.pyx 
							
						
					 
				 
				
					
						
							
							Remove unused import statements 
						
					 
				 
				2017-03-21 21:08:54 +01:00  
		
			
			
			
			
				
					
						
							
								train.py 
							
						
					 
				 
				
					
						
							
							Don't reapply the model during training 
						
					 
				 
				2017-03-16 11:59:43 -05:00  
		
			
			
			
			
				
					
						
							
								typedefs.pxd 
							
						
					 
				 
				
					
						
							
							Revert "Work on Issue  #285 : intern strings into document-specific pools, to address streaming data memory growth. StringStore.__getitem__ now raises KeyError when it can't find the string. Use StringStore.intern() to get the old behaviour. Still need to hunt down all uses of StringStore.__getitem__ in library and do testing, but logic looks good." 
						
					 
				 
				2016-09-30 20:20:22 +02:00  
		
			
			
			
			
				
					
						
							
								typedefs.pyx 
							
						
					 
				 
				
					
						
							
							* Move POS tag definitions to parts_of_speech.pxd 
						
					 
				 
				2015-01-25 16:31:07 +11:00  
		
			
			
			
			
				
					
						
							
								util.py 
							
						
					 
				 
				
					
						
							
							Fix whitespace 
						
					 
				 
				2017-04-07 10:22:18 +02:00  
		
			
			
			
			
				
					
						
							
								vocab.pxd 
							
						
					 
				 
				
					
						
							
							Revert "Work on Issue  #285 : intern strings into document-specific pools, to address streaming data memory growth. StringStore.__getitem__ now raises KeyError when it can't find the string. Use StringStore.intern() to get the old behaviour. Still need to hunt down all uses of StringStore.__getitem__ in library and do testing, but logic looks good." 
						
					 
				 
				2016-09-30 20:20:22 +02:00  
		
			
			
			
			
				
					
						
							
								vocab.pyx 
							
						
					 
				 
				
					
						
							
							Merge branch 'master' of  https://github.com/explosion/spaCy 
						
					 
				 
				2017-03-17 18:30:53 +01:00