mirror of
https://github.com/explosion/spaCy.git
synced 2024-11-10 19:57:17 +03:00
Fix inconsistent label freq cutoff for projectivisation
This commit is contained in:
parent
7b66ec896a
commit
b8d52cb285
|
@@ -133,10 +133,10 @@ class GoldCorpus(object):
|
|||
def train_docs(self, nlp, gold_preproc=False,
|
||||
projectivize=False, max_length=None,
|
||||
noise_level=0.0):
|
||||
train_tuples = self.train_tuples
|
||||
train_tuples = list(self.train_tuples)
|
||||
if projectivize:
|
||||
train_tuples = nonproj.preprocess_training_data(
|
||||
self.train_tuples, label_freq_cutoff=100)
|
||||
self.train_tuples, label_freq_cutoff=30)
|
||||
random.shuffle(train_tuples)
|
||||
gold_docs = self.iter_gold_docs(nlp, train_tuples, gold_preproc,
|
||||
max_length=max_length,
|
||||
|
|
Loading…
Reference in New Issue
Block a user