mirror of
https://github.com/explosion/spaCy.git
synced 2025-06-29 01:13:17 +03:00
Fix size limits in training data
This commit is contained in:
parent
8446b35ce0
commit
f328c195ca
|
@@ -160,7 +160,7 @@ class GoldCorpus(object):
|
||||||
yield item
|
yield item
|
||||||
i += len(item[1])
|
i += len(item[1])
|
||||||
if limit and i >= limit:
|
if limit and i >= limit:
|
||||||
break
|
return
|
||||||
|
|
||||||
@property
|
@property
|
||||||
def dev_tuples(self):
|
def dev_tuples(self):
|
||||||
|
@@ -180,7 +180,7 @@ class GoldCorpus(object):
|
||||||
n += len(sent_tuples[1])
|
n += len(sent_tuples[1])
|
||||||
if self.limit and i >= self.limit:
|
if self.limit and i >= self.limit:
|
||||||
break
|
break
|
||||||
i += len(paragraph_tuples)
|
i += 1
|
||||||
return n
|
return n
|
||||||
|
|
||||||
def train_docs(self, nlp, gold_preproc=False, max_length=None,
|
def train_docs(self, nlp, gold_preproc=False, max_length=None,
|
||||||
|
|
Loading…
Reference in New Issue
Block a user