# spaCy/examples/pipeline/wiki_entity_linking/run_el.py

# coding: utf-8
from __future__ import unicode_literals

import spacy

# requires: pip install neuralcoref --no-binary neuralcoref
# import neuralcoref


# TODO
def add_coref():
    """ Add coreference resolution to our model

    Loads the small English model, runs it over a sample sentence pair and
    prints the coreference results stored on the document's extension
    attributes (``has_coref`` and ``coref_clusters``).

    The step that adds the neuralcoref component to the pipeline is still
    disabled (see the TODO below). While it is disabled, the extension
    attributes are presumably never registered, so they are only printed
    when they actually exist.
    """
    nlp = spacy.load('en_core_web_sm')
    # nlp = spacy.load('en')

    # TODO: this doesn't work yet
    # neuralcoref.add_to_pipe(nlp)
    print("done adding to pipe")

    doc = nlp(u'My sister has a dog. She loves him.')
    print("done doc")

    # Reading an unregistered extension through `doc._` raises an
    # AttributeError, so check for the attributes before touching them.
    if doc.has_extension('has_coref') and doc.has_extension('coref_clusters'):
        print(doc._.has_coref)
        print(doc._.coref_clusters)
    else:
        print("coref extensions are not registered, skipping coref output")


# TODO
def _run_ner_depr(nlp, clean_text, article_dict):
    """ Print each PERSON entity found in a text together with its looked-up ID

    nlp: callable that turns a text into a doc exposing an `ents` iterable.
    clean_text: the text handed to `nlp`.
    article_dict: mapping that is queried with each entity's text via `.get`.

    Entities whose label is not "PERSON" are skipped. When the lookup gives
    nothing (or any falsy value), '???' is printed in place of the ID.
    Returns nothing; all results go to stdout.
    """
    unresolved = '???'  # TODO: investigate these cases

    # TODO: expand to non-persons
    people = (span for span in nlp(clean_text).ents if span.label_ == "PERSON")

    for span in people:
        found_id = article_dict.get(span.text)
        print(" -", span.text, span.label_, found_id if found_id else unresolved)
refactor code to separate functionality into different files 2019-05-06 11:56:56 +03:00			`# coding: utf-8`
			`from __future__ import unicode_literals`

			`import spacy`

			`# requires: pip install neuralcoref --no-binary neuralcoref`
			`# import neuralcoref`


			`# TODO`
			`def add_coref():`
			`""" Add coreference resolution to our model """`
			`nlp = spacy.load('en_core_web_sm')`
			`# nlp = spacy.load('en')`

			`# TODO: this doesn't work yet`
			`# neuralcoref.add_to_pipe(nlp)`
			`print("done adding to pipe")`

			`doc = nlp(u'My sister has a dog. She loves him.')`
			`print("done doc")`

			`print(doc._.has_coref)`
			`print(doc._.coref_clusters)`


			`# TODO`
			`def _run_ner_depr(nlp, clean_text, article_dict):`
			`doc = nlp(clean_text)`
			`for ent in doc.ents:`
			`if ent.label_ == "PERSON": # TODO: expand to non-persons`
			`ent_id = article_dict.get(ent.text)`
			`if ent_id:`
			`print(" -", ent.text, ent.label_, ent_id)`
			`else:`
			`print(" -", ent.text, ent.label_, '???') # TODO: investigate these cases`