mirror of
https://github.com/explosion/spaCy.git
synced 2024-11-11 04:08:09 +03:00
slightly more challenging unit test
This commit is contained in:
parent
6651fafd5c
commit
6208d322d3
|
@@ -12,8 +12,8 @@ from spacy.util import minibatch_by_words
|
|||
([400, 400, 199], [3]),
|
||||
([400, 400, 199, 3], [4]),
|
||||
([400, 400, 199, 3, 1], [5]),
|
||||
([400, 400, 199, 3, 250], [3, 2]),
|
||||
([400, 400, 199, 3, 1, 250], [3, 3]),
|
||||
([400, 400, 199, 3, 200], [3, 2]),
|
||||
([400, 400, 199, 3, 1, 200], [3, 3]),
|
||||
],
|
||||
)
|
||||
def test_util_minibatch(doc_sizes, expected_batches):
|
||||
|
|
|
@@ -682,13 +682,13 @@ def minibatch_by_words(examples, size, count_words=len, tolerance=0.2, discard_o
|
|||
if not discard_oversize:
|
||||
yield [example]
|
||||
|
||||
# add the example to the current batch if it still fits
|
||||
elif (current_size + n_words) < target_size:
|
||||
# add the example to the current batch if it still fits and there's no overflow yet
|
||||
elif overflow_size == 0 and (current_size + n_words) < target_size:
|
||||
batch.append(example)
|
||||
current_size += n_words
|
||||
|
||||
# add the example to the overflow buffer if it fits in the tolerance margins
|
||||
elif (current_size + n_words) < (target_size + tol_size):
|
||||
elif (current_size + overflow_size + n_words) < (target_size + tol_size):
|
||||
overflow.append(example)
|
||||
overflow_size += n_words
|
||||
|
||||
|
|
Loading…
Reference in New Issue
Block a user