mirror of
https://github.com/explosion/spaCy.git
synced 2024-11-11 04:08:09 +03:00
Fix size limits in training data
This commit is contained in:
parent
8446b35ce0
commit
f328c195ca
|
@ -160,7 +160,7 @@ class GoldCorpus(object):
|
|||
yield item
|
||||
i += len(item[1])
|
||||
if limit and i >= limit:
|
||||
break
|
||||
return
|
||||
|
||||
@property
|
||||
def dev_tuples(self):
|
||||
|
@ -178,9 +178,9 @@ class GoldCorpus(object):
|
|||
for raw_text, paragraph_tuples in self.train_tuples:
|
||||
for sent_tuples, brackets in paragraph_tuples:
|
||||
n += len(sent_tuples[1])
|
||||
if self.limit and i >= self.limit:
|
||||
break
|
||||
i += len(paragraph_tuples)
|
||||
if self.limit and i >= self.limit:
|
||||
break
|
||||
i += 1
|
||||
return n
|
||||
|
||||
def train_docs(self, nlp, gold_preproc=False, max_length=None,
|
||||
|
|
Loading…
Reference in New Issue
Block a user