From 031b00cb91384c6014cd13673ec737930c38f2b5 Mon Sep 17 00:00:00 2001 From: Matthew Honnibal Date: Fri, 5 Feb 2016 20:12:09 +0100 Subject: [PATCH] * Fix Span.root calculation --- spacy/tests/website/test_api.py | 2 +- spacy/tokens/span.pyx | 6 ------ 2 files changed, 1 insertion(+), 7 deletions(-) diff --git a/spacy/tests/website/test_api.py b/spacy/tests/website/test_api.py index 6a7379d87..fc5eb3c7a 100644 --- a/spacy/tests/website/test_api.py +++ b/spacy/tests/website/test_api.py @@ -150,7 +150,7 @@ def test_example_i_like_new_york5(toks, autumn, dot): assert toks[autumn].head.orth_ == 'in' assert toks[dot].head.orth_ == 'like' autumn_dot = toks[autumn:] - assert autumn_dot.root.orth_ == 'Autumn' + assert autumn_dot.root.orth_ == '.' def test_navigating_the_parse_tree_lefts(doc): diff --git a/spacy/tokens/span.pyx b/spacy/tokens/span.pyx index 801c98523..82501dbc5 100644 --- a/spacy/tokens/span.pyx +++ b/spacy/tokens/span.pyx @@ -241,12 +241,6 @@ cdef class Span: cdef int _count_words_to_root(const TokenC* token, int sent_length) except -1: - # Don't allow spaces to be the root, if there are - # better candidates - if Lexeme.c_check_flag(token.lex, IS_SPACE) and token.l_kids == 0 and token.r_kids == 0: - return sent_length-1 - if Lexeme.c_check_flag(token.lex, IS_PUNCT) and token.l_kids == 0 and token.r_kids == 0: - return sent_length-1 cdef int n = 0 while token.head != 0: token += token.head