In [15]:
import spacy
from spacy import displacy
from spacy.tokens import Span

In [16]:
# Load the pretrained `en_core_web_sm` pipeline once; every later cell reuses `nlp`.
nlp = spacy.load("en_core_web_sm")
# Trailing expression: display the pipeline's component names (includes "ner").
nlp.pipe_names

['tok2vec', 'tagger', 'parser', 'attribute_ruler', 'lemmatizer', 'ner']

In [17]:
# Run the full pipeline on a sample sentence; the entities found are exposed on `doc.ents`.
doc = nlp("Tesla Inc is going to buy Twitter Inc for $45 billion.")

In [18]:
# One row per entity: surface text, label code, and spaCy's description of that label.
for entity in doc.ents:
    label = entity.label_
    print(entity.text, " | ", label, " | ", spacy.explain(label))

Tesla Inc  |  ORG  |  Companies, agencies, institutions, etc.
Twitter Inc  |  ORG  |  Companies, agencies, institutions, etc.
$45 billion  |  MONEY  |  Monetary values, including unit


## Visualize entities with displaCy

In [23]:

# Render `doc` with displaCy's entity ("ent") style.
displacy.render(doc, style="ent")

## Pre-defined entity labels in the `ner` component

In [22]:

# Display the labels registered for the pipeline's "ner" component.
nlp.pipe_labels['ner']

['CARDINAL',
 'DATE',
 'EVENT',
 'FAC',
 'GPE',
 'LANGUAGE',
 'LAW',
 'LOC',
 'MONEY',
 'NORP',
 'ORDINAL',
 'ORG',
 'PERCENT',
 'PERSON',
 'PRODUCT',
 'QUANTITY',
 'TIME',
 'WORK_OF_ART']

In [24]:
# Re-bind `doc` to a new sentence in which "Bloomberg" appears twice.
doc = nlp("Michael Bloomberg founded Bloomberg in 1982.")

In [25]:
# One row per entity: surface text, label code, and spaCy's description of that label.
for entity in doc.ents:
    label = entity.label_
    print(entity.text, " | ", label, " | ", spacy.explain(label))

Michael Bloomberg  |  PERSON  |  People, including fictional
Bloomberg  |  PERSON  |  People, including fictional
1982  |  DATE  |  Absolute or relative dates or periods


## Setting custom entities: Tesla and Twitter are not recognized here

In [28]:

# Same headline without the "Inc" suffixes; list whatever entities the model finds now.
doc = nlp("Tesla is going to buy Twitter for $45 billion.")
for entity in doc.ents:
    label = entity.label_
    print(entity.text, " | ", label, " | ", spacy.explain(label))

$45 billion  |  MONEY  |  Monetary values, including unit


In [30]:
# Slicing a Doc yields a Span object, even for a single-token slice.
type(doc[:1])

spacy.tokens.span.Span

In [31]:
# The one-token span covering token 0.
doc[:1]

Tesla

In [33]:
# The one-token span covering token 5 (end offset 6 is exclusive).
doc[5:6]

Twitter

In [37]:
# Manually tag the two company names that the model did not recognize above.
# Span(doc, start, end) takes token offsets with an exclusive end, so these are
# the same one-token slices inspected earlier: doc[:1] and doc[5:6].
s1 = Span(doc, 0, 1, label="ORG")
s2 = Span(doc, 5, 6, label="ORG")

# The offsets are hard-coded for this exact sentence; fail loudly if the text
# or tokenization changes instead of silently labelling the wrong tokens.
assert (s1.text, s2.text) == ("Tesla", "Twitter"), (s1.text, s2.text)

# default="unmodified" keeps the entities already present on `doc` (the MONEY
# span) while adding the two new ORG spans.
doc.set_ents([s1, s2], default="unmodified")

## Custom entities detected

In [38]:
# One row per entity: surface text, label code, and spaCy's description of that label.
for entity in doc.ents:
    label = entity.label_
    print(entity.text, " | ", label, " | ", spacy.explain(label))

Tesla  |  ORG  |  Companies, agencies, institutions, etc.
Twitter  |  ORG  |  Companies, agencies, institutions, etc.
$45 billion  |  MONEY  |  Monetary values, including unit


## Building your own NER with the `EntityRuler` class