In [1]:
# Bring in spaCy and load the small English pipeline
import spacy
nlp = spacy.load('en_core_web_sm')

# Run the pipeline over a sample sentence to obtain a Doc
doc = nlp('Tesla is looking at buying U.S. startup for $6 million')

# One line per token: its text, part-of-speech tag and dependency label
for token in doc:
    print(' '.join((token.text, token.pos_, token.dep_)))

Tesla PROPN nsubj
is AUX aux
looking VERB ROOT
at ADP prep
buying VERB pcomp
U.S. PROPN compound
startup NOUN dobj
for ADP prep
$ SYM quantmod
6 NUM compound
million NUM pobj


In [2]:
# Show the (name, component) pairs that make up the loaded pipeline
nlp.pipeline

[('tagger', <spacy.pipeline.pipes.Tagger at 0x7fe81a2ea190>),
 ('parser', <spacy.pipeline.pipes.DependencyParser at 0x7fe81a252160>),
 ('ner', <spacy.pipeline.pipes.EntityRecognizer at 0x7fe81a252220>)]

In [3]:
# A second Doc containing a contraction and a run of three spaces,
# to show how both are split into tokens
doc2 = nlp("Tesla isn't   looking into startups anymore.")
for token in doc2:
    print(' '.join((token.text, token.pos_, token.dep_)))

Tesla PROPN nsubj
is AUX aux
n't PART neg
   SPACE 
looking VERB ROOT
into ADP prep
startups NOUN pobj
anymore ADV advmod
. PUNCT punct


In [4]:
# Displaying the Doc shows its original text, extra spaces included
doc2

Tesla isn't   looking into startups anymore.

In [5]:
# Indexing a Doc returns the token at that position
doc2[0]

Tesla

In [6]:
# Part-of-speech tag of the first token
doc2[0].pos_

'PROPN'

In [7]:
# Dependency label of the first token
doc2[0].dep_

'nsubj'

In [8]:
# Index 4 is 'looking': the whitespace run occupies its own slot at index 3
doc2[4]

looking

In [9]:
# The token's text as a plain Python string
doc2[4].text

'looking'

In [10]:
# Lemma (base form) of the token
doc2[4].lemma_

'look'

In [11]:
# Part-of-speech tag of the same token
doc2[4].pos_

'VERB'

In [16]:
# Simple part-of-speech tag first, then the detailed tag alongside
# spaCy's human-readable explanation of it
print(doc2[4].pos_)
print(' / '.join((doc2[4].tag_, spacy.explain(doc2[4].tag_))))

VERB
VBG / verb, gerund or present participle


In [17]:
# Word shapes: the pattern of upper/lower-case letters and punctuation in a token
print(doc2[0].text, doc2[0].shape_, sep=': ')
# Taken from `doc` (the first sentence), not `doc2`: its token 5 is 'U.S.'
print(doc[5].text, doc[5].shape_, sep=' : ')

Tesla: Xxxxx
U.S. : X.X.


In [18]:
# Boolean token flags, one per output line: is_alpha, then is_stop
print(doc2[0].is_alpha, doc2[0].is_stop, sep='\n')

True
False


In [19]:
# Build a longer Doc to slice from later.
# The text is written as adjacent string literals, which Python joins into a
# single string; unlike backslash continuations inside one literal, this is
# not broken by trailing whitespace or by indenting the continued lines.
# Also fixes the misspelling "commmonly" in the sample text; the token count
# is unchanged, so index-based slices of doc3 still line up.
doc3 = nlp(
    'Although commonly attributed to John Lennon from his song "Beautiful Boy", '
    'the phrase "Life is what happens to us while we are making other plans" was written by '
    "cartoonist Allen Saunders and published in Reader's Digest in 1957, when Lennon was 17."
)

In [20]:
# Tokens 16-29 cover the quotation, opening and closing quote marks included
life_quote = doc3[16:30]
print(life_quote.text)

"Life is what happens to us while we are making other plans"


In [21]:
# Slicing a Doc yields a Span rather than another Doc
type(life_quote)

spacy.tokens.span.Span

In [22]:
# Three short sentences in one Doc, used to demonstrate sentence segmentation
doc4 = nlp(
    'This is the first sentence. '
    'This is another sentence. '
    'This is the last sentence.'
)

In [23]:
# Walk the sentences spaCy detected and print the text of each one
for sent in doc4.sents:
    print(sent.text)

This is the first sentence.
This is another sentence.
This is the last sentence.


In [24]:
# Token 6 is the first word of the second sentence
doc4[6]

This

In [25]:
# Check whether this token is marked as the start of a sentence
doc4[6].is_sent_start

True