mirror of
				https://github.com/explosion/spaCy.git
				synced 2025-11-04 01:48:04 +03:00 
			
		
		
		
	Merge pull request #629 from kylepjohnson/master
Fix attribute error in nn_text_class.py, add module docstring
This commit is contained in:
		
						commit
						901a96f7cd
					
				| 
						 | 
					@ -1,3 +1,11 @@
 | 
				
			||||||
 | 
					"""This script expects something like a binary sentiment data set, such as
 | 
				
			||||||
 | 
					 that available here: `http://www.cs.cornell.edu/people/pabo/movie-review-data/`
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					It expects a directory structure like: `data_dir/train/{pos|neg}`
 | 
				
			||||||
 | 
					 and `data_dir/test/{pos|neg}`. Put (say) 90% of the files in the former
 | 
				
			||||||
 | 
					 and the remainder in the latter.
 | 
				
			||||||
 | 
					"""
 | 
				
			||||||
 | 
					
 | 
				
			||||||
from __future__ import unicode_literals
 | 
					from __future__ import unicode_literals
 | 
				
			||||||
from __future__ import print_function
 | 
					from __future__ import print_function
 | 
				
			||||||
from __future__ import division
 | 
					from __future__ import division
 | 
				
			||||||
| 
						 | 
					@ -56,7 +64,7 @@ class Extractor(object):
 | 
				
			||||||
        self.vector.fill(0)
 | 
					        self.vector.fill(0)
 | 
				
			||||||
        n = 0
 | 
					        n = 0
 | 
				
			||||||
        for orth_id, freq in bow.items():
 | 
					        for orth_id, freq in bow.items():
 | 
				
			||||||
            self.vector += self.nlp.vocab[self.nlp.vocab.strings[orth_id]].repvec * freq
 | 
					            self.vector += self.nlp.vocab[self.nlp.vocab.strings[orth_id]].vector * freq
 | 
				
			||||||
            # Apply the fine-tuning we've learned
 | 
					            # Apply the fine-tuning we've learned
 | 
				
			||||||
            if orth_id < E.shape[0]:
 | 
					            if orth_id < E.shape[0]:
 | 
				
			||||||
                self.vector += E[orth_id] * freq
 | 
					                self.vector += E[orth_id] * freq
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
		Loading…
	
		Reference in New Issue
	
	Block a user