In [1]:
import spacy

# Blank English pipeline; the `nlp.pipe_names` cell further down shows it has
# no components, so calling it here only splits the text into tokens.
nlp = spacy.blank("en")

sentence = "The sun did gaze upon the peasants toiling in the fields, and one of them spake, 'I shall not yield, though the sun doth smile upon me.'"
doc = nlp(sentence)

# Emit one token per line (punctuation and quotes come out as separate tokens).
for token in doc:
    print(token)

The
sun
did
gaze
upon
the
peasants
toiling
in
the
fields
,
and
one
of
them
spake
,
'
I
shall
not
yield
,
though
the
sun
doth
smile
upon
me
.
'


In [4]:
# Display the component names of the pipeline currently bound to `nlp`.
nlp.pipe_names

[]

In [6]:
# Rebind `nlp` from the blank pipeline to the "en_core_web_sm" package.
# NOTE(review): every later cell that calls `nlp(...)` now uses this pipeline.
nlp = spacy.load("en_core_web_sm")
# Display the component names of the loaded pipeline.
nlp.pipe_names

['tok2vec', 'tagger', 'parser', 'attribute_ruler', 'lemmatizer', 'ner']

In [7]:
# Display the pipeline as (name, component object) pairs.
nlp.pipeline

[('tok2vec', <spacy.pipeline.tok2vec.Tok2Vec at 0x1151daab0>),
 ('tagger', <spacy.pipeline.tagger.Tagger at 0x1151da870>),
 ('parser', <spacy.pipeline.dep_parser.DependencyParser at 0x1152358c0>),
 ('attribute_ruler',
  <spacy.pipeline.attributeruler.AttributeRuler at 0x11536d9d0>),
 ('lemmatizer', <spacy.lang.en.lemmatizer.EnglishLemmatizer at 0x11537c450>),
 ('ner', <spacy.pipeline.ner.EntityRecognizer at 0x1152359a0>)]

In [8]:
sentence = "The sun did gaze upon the peasants toiling in the fields, and one of them spake, 'I shall not yield, though the sun doth smile upon me.'"
doc = nlp(sentence)

# One row per token: text, description of its part-of-speech tag, lemma.
# The separator is two spaces, a pipe, two spaces, so every row is laid out
# as "text  |  description  |  lemma".
for token in doc:
    pos_description = spacy.explain(token.pos_)
    print(token, pos_description, token.lemma_, sep="  |  ")

The  |  determiner  |  the
sun  |  noun  |  sun
did  |  auxiliary  |  do
gaze  |  verb  |  gaze
upon  |  subordinating conjunction  |  upon
the  |  determiner  |  the
peasants  |  noun  |  peasant
toiling  |  verb  |  toil
in  |  adposition  |  in
the  |  determiner  |  the
fields  |  noun  |  field
,  |  punctuation  |  ,
and  |  coordinating conjunction  |  and
one  |  numeral  |  one
of  |  adposition  |  of
them  |  pronoun  |  they
spake  |  adjective  |  spake
,  |  punctuation  |  ,
'  |  punctuation  |  '
I  |  pronoun  |  I
shall  |  auxiliary  |  shall
not  |  particle  |  not
yield  |  verb  |  yield
,  |  punctuation  |  ,
though  |  subordinating conjunction  |  though
the  |  determiner  |  the
sun  |  noun  |  sun
doth  |  noun  |  doth
smile  |  noun  |  smile
upon  |  subordinating conjunction  |  upon
me  |  pronoun  |  I
.  |  punctuation  |  .
'  |  punctuation  |  '


Named Entity Recognition

In [15]:
doc = nlp("Tata steel founder is Mr. Ratan Tata")

# List every entity span the pipeline found, followed by its label.
for ent in doc.ents:
    print(f"{ent.text} {ent.label_}")

Tata ORG
Ratan Tata PERSON


In [16]:
from spacy import displacy

# Visualize `doc` with displaCy using the "ent" style.
displacy.render(doc, style="ent")

Trained processing pipeline in French

In [17]:
# Rebind `nlp` to the "fr_core_news_sm" package.
# NOTE(review): this replaces the English pipeline loaded earlier; re-running
# an earlier English cell after this one would process its text with this pipeline.
nlp = spacy.load("fr_core_news_sm")

In [18]:
doc = nlp("Tesla Inc va racheter Twitter pour $45 milliards de dollars")

# One row per entity: span text, label code, and spaCy's explanation of that label.
for ent in doc.ents:
    print(ent.text, ent.label_, spacy.explain(ent.label_), sep="  |  ")

Tesla Inc  |  PER  |  Named person or family.
Twitter  |  MISC  |  Miscellaneous entities, e.g. events, nationalities, products or works of art


In [19]:
# One row per token of the current `doc`: text, POS tag, lemma.
for token in doc:
    print(token, token.pos_, token.lemma_, sep="  |  ")

Tesla  |  PROPN  |  Tesla
Inc  |  PROPN  |  Inc
va  |  VERB  |  aller
racheter  |  VERB  |  racheter
Twitter  |  VERB  |  twitter
pour  |  ADP  |  pour
$  |  NOUN  |  dollar
45  |  NUM  |  45
milliards  |  NOUN  |  milliard
de  |  ADP  |  de
dollars  |  NOUN  |  dollar
