In [1]:
import spacy

# Load spaCy's small English pipeline. The "en_core_web_sm" package must already
# be installed (e.g. `python -m spacy download en_core_web_sm`).
nlp = spacy.load("en_core_web_sm")

In [2]:
# Run the pipeline on a sample sentence; the recognized entities end up in doc.ents.
doc = nlp("Tesla Inc is acquired Twitter for 45$ Billon.")

# Each item of doc.ents is an entity (it may cover several tokens, e.g. "Tesla Inc"),
# so print its text, its label, and spaCy's description of that label.
for ent in doc.ents:
    label = ent.label_
    print(ent, " | ", label, " | ", spacy.explain(label))

Tesla Inc  |  ORG  |  Companies, agencies, institutions, etc.
Twitter  |  PRODUCT  |  Objects, vehicles, foods, etc. (not services)
45$ Billon  |  MONEY  |  Monetary values, including unit


In [3]:
# Same sentence, but with "Twitter Inc" instead of "Twitter", to see how the
# extra context changes the label the model predicts for it.
doc = nlp("Tesla Inc is acquired Twitter Inc for 45$ Billon.")

# Print every entity with its label and spaCy's description of that label.
for ent in doc.ents:
    label = ent.label_
    print(ent, " | ", label, " | ", spacy.explain(label))

Tesla Inc  |  ORG  |  Companies, agencies, institutions, etc.
Twitter Inc  |  ORG  |  Companies, agencies, institutions, etc.
45$ Billon  |  MONEY  |  Monetary values, including unit


In [4]:
# Visualize the recognized entities inline with displaCy's entity ("ent") renderer.
from spacy import displacy
displacy.render(doc, style="ent")

In [5]:
# List the entity labels registered for the pipeline's "ner" component.
nlp.pipe_labels['ner']

['CARDINAL',
 'DATE',
 'EVENT',
 'FAC',
 'GPE',
 'LANGUAGE',
 'LAW',
 'LOC',
 'MONEY',
 'NORP',
 'ORDINAL',
 'ORG',
 'PERCENT',
 'PERSON',
 'PRODUCT',
 'QUANTITY',
 'TIME',
 'WORK_OF_ART']

# Customizing Entities

In [6]:
# Baseline for the customization below: see what the model predicts on its own.
doc = nlp("Tesla is acquired Twitter for 45$ Billon.")

# Print every entity's text with its label and spaCy's description of that label.
for ent in doc.ents:
    label = ent.label_
    print(ent.text, " | ", label, " | ", spacy.explain(label))

Tesla  |  ORG  |  Companies, agencies, institutions, etc.
Twitter  |  PRODUCT  |  Objects, vehicles, foods, etc. (not services)
45$ Billon  |  MONEY  |  Monetary values, including unit


In [7]:
# Integer indexing on the Doc yields a single token (here the first one).
doc[0]

Tesla

In [8]:
# Check the type of an integer-indexed element of the Doc.
type(doc[0])

spacy.tokens.token.Token

In [9]:
# Slicing the Doc yields a multi-token span: tokens 2 and 3 (end index is exclusive).
doc[2:4]

acquired Twitter

In [10]:
# Check the type produced by slicing the Doc.
type(doc[2:4])

spacy.tokens.span.Span

In [11]:
from spacy.tokens import Span

s1 = Span(doc, 0, 1, label="Org")
s2 = Span(doc, 3, 4, label="Org")

doc.set_ents([s1, s2], default="unmodified")

In [12]:
for token in doc.ents:
    print(token.text, " | ", token.label_, " | ", spacy.explain(token.label_))

Tesla  |  Org  |  None
Twitter  |  Org  |  None
45$ Billon  |  MONEY  |  Monetary values, including unit




In [13]:
# Re-render the entities to visualize the manually assigned labels.
# NOTE(review): displacy is already imported in an earlier cell; this repeated
# import is harmless but redundant.
from spacy import displacy
displacy.render(doc, style="ent")