In [1]:
import spacy

# Start from an empty English pipeline and run it over a short sample text.
nlp = spacy.blank("en")
sample_text = "Asif hit 150 sixes in the nets. Scored a duck in the match"
doc = nlp(sample_text)

# Iterating a Doc yields its tokens; print them one per line.
print(*doc, sep="\n")

Asif
hit
150
sixes
in
the
nets
.
Scored
a
duck
in
the
match


In [2]:
# Component names registered on the blank pipeline (the output below is an empty list).
nlp.pipe_names

[]

In [3]:
# Rebind `nlp` to the packaged "en_core_web_sm" pipeline; the following cells use this object.
nlp = spacy.load("en_core_web_sm")

In [4]:
# Component names of the loaded pipeline, in the order they are listed by spaCy.
nlp.pipe_names

['tok2vec', 'tagger', 'parser', 'attribute_ruler', 'lemmatizer', 'ner']

In [5]:
# Same components as `pipe_names`, but as (name, component object) pairs.
nlp.pipeline

[('tok2vec', <spacy.pipeline.tok2vec.Tok2Vec at 0xa4138b5100>),
 ('tagger', <spacy.pipeline.tagger.Tagger at 0xa4138b5a00>),
 ('parser', <spacy.pipeline.dep_parser.DependencyParser at 0xa413a4acf0>),
 ('attribute_ruler',
  <spacy.pipeline.attributeruler.AttributeRuler at 0xa412e1d3c0>),
 ('lemmatizer', <spacy.lang.en.lemmatizer.EnglishLemmatizer at 0xa412e0b500>),
 ('ner', <spacy.pipeline.ner.EntityRecognizer at 0xa411b27970>)]

In [6]:
# Re-process the sample text, this time with the loaded pipeline bound to `nlp`.
doc = nlp("Asif hit 150 sixes in the nets. Scored a duck in the match")

# One row per token: token | human-readable POS description | lemma.
for tok in doc:
    pos_description = spacy.explain(tok.pos_)
    print(f"{tok}  |  {pos_description}  |  {tok.lemma_}")

Asif  |  proper noun  |  Asif
hit  |  verb  |  hit
150  |  numeral  |  150
sixes  |  noun  |  six
in  |  adposition  |  in
the  |  determiner  |  the
nets  |  noun  |  net
.  |  punctuation  |  .
Scored  |  verb  |  score
a  |  determiner  |  a
duck  |  noun  |  duck
in  |  adposition  |  in
the  |  determiner  |  the
match  |  noun  |  match


### Named Entity Recognition

In [8]:
# Run the pipeline on a new sentence and list each entity span with its label.
doc = nlp("Tesla Inc. is going to buy twitter for $45 billion.")
for entity in doc.ents:
    print(f"{entity.text} {entity.label_}")

Tesla Inc. ORG
$45 billion MONEY


In [9]:
# NOTE(review): this import sits mid-notebook; consider moving it next to `import spacy` in the first cell.
from spacy import displacy

# Render the entities of the `doc` produced by the previous cell using displaCy's "ent" style.
displacy.render(doc, style="ent")

### Adding a component to a blank pipeline

In [10]:
# Load "en_core_web_sm" under a separate name so a component can be sourced from it
# after `nlp` is rebound to a blank pipeline in the next cell.
source_nlp = spacy.load("en_core_web_sm")

In [11]:
# Start again from a blank English pipeline ...
nlp = spacy.blank("en")
# ... and add only the "ner" component, taken from the already-loaded `source_nlp`.
nlp.add_pipe("ner", source=source_nlp)
# Bare last expression so the notebook displays the resulting component names.
nlp.pipe_names

['ner']

In [12]:
# Same sentence as the earlier NER cell, now processed by the pipeline that holds only "ner".
doc = nlp("Tesla Inc. is going to buy twitter for $45 billion.")
for entity in doc.ents:
    print(f"{entity.text} {entity.label_}")

Tesla Inc. ORG
$45 billion MONEY
