spaCy/sandbox_test_sofie/testing_el.py

27 lines
609 B
Python
Raw Normal View History

import spacy
def add_el() -> None:
    """Add an 'el' pipe to a small English pipeline and print its output.

    Loads the ``en_core_web_sm`` model, appends a pipe created under the
    name ``'el'`` as the last component, runs a sample sentence through the
    pipeline, and prints the entity type and KB id of every token followed
    by the label and KB id of every entity span.

    NOTE(review): ``'el'`` is presumably the entity-linking component of
    this development branch -- confirm against the registered pipe names.
    """
    nlp = spacy.load('en_core_web_sm')
    print("pipes before:", nlp.pipe_names)

    # Append the new component at the end of the pipeline so it runs after
    # the components that ship with the loaded model.
    el_pipe = nlp.create_pipe(name='el')
    nlp.add_pipe(el_pipe, last=True)

    print("pipes after:", nlp.pipe_names)
    print()

    text = (
        "The Hitchhiker's Guide to the Galaxy, written by Douglas Adams, "
        "reminds us to always bring our towel."
    )
    doc = nlp(text)

    # Token-level view: one line per token.
    for token in doc:
        print("token", token.text, token.ent_type_, token.ent_kb_id_)

    # Blank line separating the token listing from the entity listing.
    print()

    # Span-level view: one line per entity.
    for ent in doc.ents:
        print("ent", ent.text, ent.label_, ent.kb_id_)
# Run the demo only when this file is executed as a script, not on import.
if __name__ == "__main__":
    add_el()