In [1]:
import spacy

nlp = spacy.load("en_core_web_sm") 

In [2]:
nlp.pipe_names

['tok2vec', 'tagger', 'parser', 'attribute_ruler', 'lemmatizer', 'ner']

In [3]:
nlp.pipeline

[('tok2vec', <spacy.pipeline.tok2vec.Tok2Vec at 0x1565bdcae10>),
 ('tagger', <spacy.pipeline.tagger.Tagger at 0x1565b77c530>),
 ('parser', <spacy.pipeline.dep_parser.DependencyParser at 0x1565e388b30>),
 ('attribute_ruler',
  <spacy.pipeline.attributeruler.AttributeRuler at 0x1565e613750>),
 ('lemmatizer', <spacy.lang.en.lemmatizer.EnglishLemmatizer at 0x1565e63f2d0>),
 ('ner', <spacy.pipeline.ner.EntityRecognizer at 0x1565e388dd0>)]

In [4]:
doc = nlp("Captain america ate 100$ of samosa. Then he said I can do this all day.")

for token in doc:
    print(token, " | ", spacy.explain(token.pos_), " | ", token.lemma_)

Captain  |  proper noun  |  Captain
america  |  proper noun  |  america
ate  |  verb  |  eat
100  |  numeral  |  100
$  |  numeral  |  $
of  |  adposition  |  of
samosa  |  proper noun  |  samosa
.  |  punctuation  |  .
Then  |  adverb  |  then
he  |  pronoun  |  he
said  |  verb  |  say
I  |  pronoun  |  I
can  |  auxiliary  |  can
do  |  verb  |  do
this  |  pronoun  |  this
all  |  determiner  |  all
day  |  noun  |  day
.  |  punctuation  |  .


NER

In [5]:
doc = nlp("Tesla Inc is going to acquire twitter for $45 billion")
for ent in doc.ents:
    print(ent.text, ent.label_)

Tesla Inc ORG
$45 billion MONEY


In [6]:
doc = nlp("Tesla Inc va racheter Twitter pour $45 milliards de dollars")
for ent in doc.ents:
    print(ent.text, " | ", ent.label_, " | ", spacy.explain(ent.label_))

Tesla Inc va  |  ORG  |  Companies, agencies, institutions, etc.
Twitter  |  PERSON  |  People, including fictional
$45 milliards de dollars  |  MONEY  |  Monetary values, including unit


In [7]:
for token in doc:
    print(token, " | ", token.pos_, " | ", token.lemma_)

Tesla  |  PROPN  |  Tesla
Inc  |  PROPN  |  Inc
va  |  PROPN  |  va
racheter  |  NOUN  |  racheter
Twitter  |  PROPN  |  Twitter
pour  |  VERB  |  pour
$  |  SYM  |  $
45  |  NUM  |  45
milliards  |  NOUN  |  milliard
de  |  ADP  |  de
dollars  |  NOUN  |  dollar


In [8]:
source_nlp = spacy.load("en_core_web_sm")

nlp = spacy.blank("en")
nlp.add_pipe("ner", source=source_nlp)
nlp.pipe_names

['ner']

In [9]:
text = '''Ravi and Raju are the best friends from school days.They wanted to go for a world tour and 
visit famous cities like Paris, London, Dubai, Rome etc and also they called their another friend Mohan to take part of this world tour.
They started their journey from Hyderabad and spent next 3 months travelling all the wonderful cities in the world and cherish a happy moments!
'''
doc = nlp(text)  
all_proper_nouns = [] 
for token in doc:
  if token.pos_ == "PROPN":       
    all_proper_nouns.append(token)
print("Proper Nouns: ", all_proper_nouns)
print("Count: ", len(all_proper_nouns))

Proper Nouns:  []
Count:  0
