In [1]:
import spacy

In [2]:
nlp = spacy.load('en_core_web_sm')

In [3]:
nlp.pipe_names

['tok2vec', 'tagger', 'parser', 'attribute_ruler', 'lemmatizer', 'ner']

In [4]:
text = nlp("Tesla Inc is going to acquire twitter for $45 billion")

for ent in text.ents:
  print(ent.text, " | ", ent.label_, " | ", spacy.explain(ent.label_))

Tesla Inc  |  ORG  |  Companies, agencies, institutions, etc.
$45 billion  |  MONEY  |  Monetary values, including unit


In [5]:
text1 = nlp("Tesla Inc is going to acquire twitter for forty five billion dollars")

for ent in text.ents:
  print(ent.text, " | ", ent.label_, " | ", spacy.explain(ent.label_))

Tesla Inc  |  ORG  |  Companies, agencies, institutions, etc.
$45 billion  |  MONEY  |  Monetary values, including unit


In [6]:
from spacy import displacy

displacy.render(text, style="ent")

In [7]:
text2 = nlp("Elon Musk runs an organisation named Tesla")

from spacy import displacy

displacy.render(text2, style="ent")

In [8]:
nlp.pipe_labels['ner']

['CARDINAL',
 'DATE',
 'EVENT',
 'FAC',
 'GPE',
 'LANGUAGE',
 'LAW',
 'LOC',
 'MONEY',
 'NORP',
 'ORDINAL',
 'ORG',
 'PERCENT',
 'PERSON',
 'PRODUCT',
 'QUANTITY',
 'TIME',
 'WORK_OF_ART']

In [9]:
doc = nlp("Michael Bloomberg founded Bloomberg in 1982")

from spacy import displacy

displacy.render(doc, style="ent")

### Setting own entities

In [10]:
doc = nlp("Tesla Inc is going to acquire twitter for $45 billion")
for ent in doc.ents:
  print(ent.text, " | ", ent.label_)

Tesla Inc  |  ORG
$45 billion  |  MONEY


In [11]:
s = doc[3:6]
s

going to acquire

In [12]:
type(s)

spacy.tokens.span.Span

In [13]:
from spacy.tokens import Span

s1 = Span(doc, 0, 2, label='ORG')
s2 = Span(doc, 8,11, label='ORG')

doc.set_ents([s1,s2], default='unmodified')

In [14]:
for ent in doc.ents:
  print(ent.text, " | ", ent.label_)

Tesla Inc  |  ORG
$45 billion  |  ORG


In [16]:
text2 = nlp("Arin Sharma runs an organisation named Arin Foundation")

s1 = Span(doc, 0, 2, label='PERSON')
s2 = Span(doc, 6,8, label='ORG')

text2.set_ents([s1,s2], default='unmodified')

from spacy import displacy

displacy.render(text2, style="ent")