Merge pull request #629 from kylepjohnson/master

Fix attribute error in nn_text_class.py, add module docstring
2025-11-06 19:07:30 +03:00 · 2016-11-14 05:26:56 +11:00 · 2016-11-14 05:26:56 +11:00 · 901a96f7cd
commit 901a96f7cd
parent 12a7b05360 d105771a07
1 changed files with 9 additions and 1 deletions
--- a/examples/nn_text_class.py
+++ b/examples/nn_text_class.py
@@ -1,3 +1,11 @@
+"""This script expects something like a binary sentiment data set, such as
+ that available here: `http://www.cs.cornell.edu/people/pabo/movie-review-data/`
+
+It expects a directory structure like: `data_dir/train/{pos|neg}`
+ and `data_dir/test/{pos|neg}`. Put (say) 90% of the files in the former
+ and the remainder in the latter.
+"""
+
 from __future__ import unicode_literals
 from __future__ import print_function
 from __future__ import division
@@ -56,7 +64,7 @@ class Extractor(object):
        self.vector.fill(0)
        n = 0
        for orth_id, freq in bow.items():
-            self.vector += self.nlp.vocab[self.nlp.vocab.strings[orth_id]].repvec * freq
+            self.vector += self.nlp.vocab[self.nlp.vocab.strings[orth_id]].vector * freq
            # Apply the fine-tuning we've learned
            if orth_id < E.shape[0]:
                self.vector += E[orth_id] * freq