formatting

This commit is contained in:
Peter Baumgartner 2023-01-24 13:34:31 -05:00
parent 7a0faed7a7
commit de6e29ae8f

View File

@@ -1208,11 +1208,12 @@ def test_walk_directory():
assert (len(walk_directory(d, suffix="conll"))) == 3
assert (len(walk_directory(d, suffix="pdf"))) == 0
def test_debug_data_trainable_lemmatizer_basic():
examples = [
("She likes green eggs", {"lemmas": ["she", "like", "green", "egg"]}),
("Eat blue ham", {"lemmas": ["eat", "blue", "ham"]}),
]
]
nlp = Language()
train_examples = []
for t in examples:
@@ -1223,6 +1224,7 @@ def test_debug_data_trainable_lemmatizer_basic():
# this results in 4 trees
assert len(data["lemmatizer_trees"]) == 4
def test_debug_data_trainable_lemmatizer_partial():
partial_examples = [
# partial annotation
@@ -1244,6 +1246,7 @@ def test_debug_data_trainable_lemmatizer_partial():
data = _compile_gold(train_examples, ["trainable_lemmatizer"], nlp, True)
assert data["partial_lemma_annotations"] == 2
def test_debug_data_trainable_lemmatizer_low_cardinality():
low_cardinality_examples = [
("She likes green eggs", {"lemmas": ["no", "no", "no", "no"]}),
@@ -1257,6 +1260,7 @@ def test_debug_data_trainable_lemmatizer_low_cardinality():
data = _compile_gold(train_examples, ["trainable_lemmatizer"], nlp, True)
assert data["n_low_cardinality_lemmas"] == 2
def test_debug_data_trainable_lemmatizer_not_annotated():
unannotated_examples = [
("She likes green eggs", {}),