mirror of
https://github.com/explosion/spaCy.git
synced 2025-01-26 17:24:41 +03:00
Fix handling of preset entities in NER
* Fix check of valid ent_type for B * Add valid L as preset-I followed by not-I
This commit is contained in:
parent
419ae59c79
commit
6b0fec76fd
|
@ -258,7 +258,7 @@ cdef class Begin:
|
||||||
@staticmethod
|
@staticmethod
|
||||||
cdef bint is_valid(const StateC* st, attr_t label) nogil:
|
cdef bint is_valid(const StateC* st, attr_t label) nogil:
|
||||||
cdef int preset_ent_iob = st.B_(0).ent_iob
|
cdef int preset_ent_iob = st.B_(0).ent_iob
|
||||||
cdef int preset_ent_label = st.B_(0).ent_type
|
cdef attr_t preset_ent_label = st.B_(0).ent_type
|
||||||
# If we're the last token of the input, we can't B -- must U or O.
|
# If we're the last token of the input, we can't B -- must U or O.
|
||||||
if st.B(1) == -1:
|
if st.B(1) == -1:
|
||||||
return False
|
return False
|
||||||
|
@ -395,6 +395,9 @@ cdef class Last:
|
||||||
return False
|
return False
|
||||||
elif not st.entity_is_open():
|
elif not st.entity_is_open():
|
||||||
return False
|
return False
|
||||||
|
elif st.B_(0).ent_iob == 1 and st.B_(1).ent_iob != 1:
|
||||||
|
# If a preset entity has I followed by not-I, is L
|
||||||
|
return True
|
||||||
elif st.E_(0).ent_type != label:
|
elif st.E_(0).ent_type != label:
|
||||||
return False
|
return False
|
||||||
elif st.B_(1).ent_iob == 1:
|
elif st.B_(1).ent_iob == 1:
|
||||||
|
|
Loading…
Reference in New Issue
Block a user