In [2]:
import spacy

In [3]:
# Load spaCy's small English model; `nlp` is the callable applied to text in the cells below.
nlp = spacy.load("en_core_web_sm")

In [4]:
# Process a sample sentence (no `u` prefix needed: Python 3 strings are already Unicode).
doc = nlp("Tesla is looking at buying U.S. Startup for $6 million")

In [7]:
# Print every token next to its part-of-speech tag (`pos_`), one pair per line.
for token in doc:
    print(f"{token} {token.pos_}")

Tesla PROPN
is VERB
looking VERB
at ADP
buying VERB
U.S. PROPN
Startup PROPN
for ADP
$ SYM
6 NUM
million NUM


In [8]:
# Inspect the loaded processing components as (name, component) pairs.
nlp.pipeline

[('tagger', <spacy.pipeline.pipes.Tagger at 0x7ff092059f60>),
 ('parser', <spacy.pipeline.pipes.DependencyParser at 0x7ff09158bac8>),
 ('ner', <spacy.pipeline.pipes.EntityRecognizer at 0x7ff09158bb28>)]

In [9]:
# Same components, names only.
nlp.pipe_names

['tagger', 'parser', 'ner']

In [11]:
# Check what kind of object calling `nlp` on text produces.
type(doc)

spacy.tokens.doc.Doc

In [14]:
# Print each token with its part-of-speech tag (`pos_`) and dependency label (`dep_`).
for t in doc:
    print(f"{t} {t.pos_} {t.dep_}")

Tesla PROPN nsubj
is VERB aux
looking VERB ROOT
at ADP prep
buying VERB pcomp
U.S. PROPN compound
Startup PROPN dobj
for ADP prep
$ SYM quantmod
6 NUM compound
million NUM pobj


In [15]:
# A sentence that itself contains double quotes and an apostrophe.
string = "\"We're moving to L.A.\""

In [16]:
# Printing shows the literal text, including its surrounding double quotes.
print(string)

"We're moving to L.A."


In [17]:
# Run the pipeline over the quoted sentence.
doc2 = nlp(string)

In [18]:
# Displaying the processed document shows its original text.
doc2

"We're moving to L.A."

In [22]:
# Tokenisation check: the surrounding quotes and the "'re" contraction become
# separate tokens, while the abbreviation "L.A." stays in one piece.
for t in doc2:
    print(f"Token: {t}\t POS: {t.pos_}")

Token: "	 POS: PUNCT
Token: We	 POS: PRON
Token: 're	 POS: VERB
Token: moving	 POS: VERB
Token: to	 POS: ADP
Token: L.A.	 POS: PROPN
Token: "	 POS: PUNCT


In [24]:
# A sentence mixing a hyphenated word, an e-mail address and a URL.
doc3 = nlp(
    "We're here to help! send snail-mail, email support@oursite.com or visit www.oursite.com!"
)

In [27]:
# "snail-mail" is split around the hyphen, whereas the e-mail address and the
# URL are each kept as a single token.
for t in doc3:
    print(f"Token:{t}\t POS: {t.pos_}")

Token:We	 POS: PRON
Token:'re	 POS: VERB
Token:here	 POS: ADV
Token:to	 POS: PART
Token:help	 POS: VERB
Token:!	 POS: PUNCT
Token:send	 POS: VERB
Token:snail	 POS: NOUN
Token:-	 POS: PUNCT
Token:mail	 POS: NOUN
Token:,	 POS: PUNCT
Token:email	 POS: NOUN
Token:support@oursite.com	 POS: X
Token:or	 POS: CCONJ
Token:visit	 POS: VERB
Token:www.oursite.com	 POS: X
Token:!	 POS: PUNCT


In [30]:
# A sentence with a distance unit and a currency amount.
doc4 = nlp("A 5km NewDelhi cab ride would cost around $2.10")

In [31]:
# "5km" is split into number and unit, and "$2.10" into symbol and amount;
# "NewDelhi" (written without a space) remains one token.
for t in doc4:
    print(f"Token: {t}\tPOS: {t.pos_}")

Token: A	POS: DET
Token: 5	POS: NUM
Token: km	POS: NOUN
Token: NewDelhi	POS: PROPN
Token: cab	POS: NOUN
Token: ride	POS: NOUN
Token: would	POS: VERB
Token: cost	POS: VERB
Token: around	POS: ADP
Token: $	POS: SYM
Token: 2.10	POS: NUM


In [32]:
# Extracting named entities

In [55]:
# Two sentences containing place and person names for entity recognition.
doc5 = nlp(
    "New Delhi is the capital of India. Narendra Modi is the Prime Minister of India."
)

In [56]:
# For every recognised entity print its text, its label and spaCy's
# human-readable explanation of that label, followed by blank lines as a separator.
for named_entity in doc5.ents:
    print(
        named_entity,
        named_entity.label_,
        spacy.explain(named_entity.label_),  # print() stringifies this, even if it is None
        "\n",
        sep="\n",
    )

New Delhi
GPE
Countries, cities, states


India
GPE
Countries, cities, states


Narendra Modi
PERSON
People, including fictional


India
GPE
Countries, cities, states




In [58]:
## Visualisations in spaCy

In [59]:
from spacy import displacy

In [74]:
# Draw the dependency parse of doc5 inline in the notebook,
# with green arcs/text on a black background and a word spacing of 70.
displacy.render(
    doc5,
    style="dep",
    jupyter=True,
    options={"distance": 70, "color": "#00ff00", "bg": "black"},
)

In [76]:
# Highlight the named entities of doc5 inline in the notebook.
# The 'distance', 'color' and 'bg' options belong to the dependency view
# (style='dep'); the entity view does not read them, so they are omitted here.
# To restyle entities, pass options={'colors': {<LABEL>: <css colour>}} instead.
displacy.render(doc5, style='ent', jupyter=True)