Update hash strings examples

This commit is contained in:
ines 2017-05-28 19:42:44 +02:00
parent c7b57ea314
commit 606879b217
4 changed files with 28 additions and 18 deletions

View File

@ -113,9 +113,11 @@ p Add a string to the #[code StringStore].
+aside-code("Example").
stringstore = StringStore([u'apple', u'orange'])
stringstore.add(u'banana')
banana_hash = stringstore.add(u'banana')
assert len(stringstore) == 3
assert stringstore[u'banana'] == 2525716904149915114L
assert banana_hash == 2525716904149915114L
assert stringstore[banana_hash] == u'banana'
assert stringstore[u'banana'] == banana_hash
+table(["Name", "Type", "Description"])
+row

View File

@ -52,15 +52,15 @@ p
assert ent_san == [u'San', u'B', u'GPE']
assert ent_francisco == [u'Francisco', u'I', u'GPE']
+table(["Text", "ent_iob", "ent_iob_", "ent_type", "ent_type_", "Description"])
+table(["Text", "ent_iob", "ent_iob_", "ent_type_", "Description"])
- var style = [0, 1, 1, 1, 1, 0]
+annotation-row(["San", 3, "B", 381, "GPE", "beginning of an entity"], style)
+annotation-row(["Francisco", 1, "I", 381, "GPE", "inside an entity"], style)
+annotation-row(["considers", 2, "O", 0, '""', "outside an entity"], style)
+annotation-row(["banning", 2, "O", 0, '""', "outside an entity"], style)
+annotation-row(["sidewalk", 2, "O", 0, '""', "outside an entity"], style)
+annotation-row(["delivery", 2, "O", 0, '""', "outside an entity"], style)
+annotation-row(["robots", 2, "O", 0, '""', "outside an entity"], style)
+annotation-row(["San", 3, "B", "GPE", "beginning of an entity"], style)
+annotation-row(["Francisco", 1, "I", "GPE", "inside an entity"], style)
+annotation-row(["considers", 2, "O", '""', "outside an entity"], style)
+annotation-row(["banning", 2, "O", '""', "outside an entity"], style)
+annotation-row(["sidewalk", 2, "O", '""', "outside an entity"], style)
+annotation-row(["delivery", 2, "O", '""', "outside an entity"], style)
+annotation-row(["robots", 2, "O", '""', "outside an entity"], style)
+h(2, "setting") Setting entity annotations
@ -148,6 +148,8 @@ include ../api/_annotation/_named-entities
+h(2, "updating") Training and updating
+under-construction
p
| To provide training examples to the entity recogniser, you'll first need
| to create an instance of the #[+api("goldparse") #[code GoldParse]] class.
@ -173,7 +175,6 @@ p
nlp.tagger(doc)
ner.update(doc, gold)
ner.model.end_training()
p
| If a character offset in your entity annotations doesn't fall on a token

View File

@ -53,9 +53,9 @@ p
+code.
doc = nlp(u'Apple is looking at buying U.K. startup for $1 billion')
apple = doc[0]
assert [apple.pos_, apple.pos] == [u'PROPN', 94]
assert [apple.tag_, apple.tag] == [u'NNP', 475]
assert [apple.shape_, apple.shape] == [u'Xxxxx', 684]
assert [apple.pos_, apple.pos] == [u'PROPN', 17049293600679659579L]
assert [apple.tag_, apple.tag] == [u'NNP', 15794550382381185553L]
assert [apple.shape_, apple.shape] == [u'Xxxxx', 16072095006890171862L]
assert apple.is_alpha == True
assert apple.is_punct == False
@ -78,10 +78,16 @@ p
assert doc[2].orth == coffee_hash == 3197928453018144401L
assert doc[2].text == coffee_text == u'coffee'
doc.vocab.strings.add(u'beer')
beer_hash = doc.vocab.strings[u'beer'] # 3073001599257881079L
beer_hash = doc.vocab.strings.add(u'beer') # 3073001599257881079L
beer_text = doc.vocab.strings[beer_hash] # 'beer'
unicorn_hash = doc.vocab.strings.add(u'🦄 ') # 18234233413267120783L
unicorn_text = doc.vocab.strings[unicorn_hash] # '🦄 '
+infobox
| #[strong API:] #[+api("stringstore") #[code stringstore]]
| #[strong Usage:] #[+a("/docs/usage/spacy-101#vocab") Vocab, hashes and lexemes 101]
+h(2, "examples-entities") Recognise and update named entities
+tag-model("NER")

View File

@ -57,8 +57,9 @@ p
assert doc.vocab.strings[u'coffee'] == 3197928453018144401L
assert doc.vocab.strings[3197928453018144401L] == u'coffee'
doc.vocab.strings.add(u'beer')
assert doc.vocab.strings[u'beer'] == 3073001599257881079L
beer_hash = doc.vocab.strings.add(u'beer')
assert doc.vocab.strings[u'beer'] == beer_hash
assert doc.vocab.strings[beer_hash] == u'beer'
p
| The #[+api("stringstore") #[code StringStore]] now resolves all strings