In [1]:
import spacy

In [2]:
# Load spaCy's small core English model and bind the resulting pipeline to `nlp`.
MODEL_NAME = "en_core_web_sm"  # "sm" = the small variant of the core English model
nlp = spacy.load(MODEL_NAME)

In [3]:
# Run the loaded pipeline over a sample sentence. The resulting Doc is broken
# into tokens -- roughly one per word, with symbols such as "$" split off.
# (No u'' prefix needed: str literals are already Unicode in Python 3.)
doc = nlp("Tesla is looking at buying U.S. startup for $6 million")

In [4]:
# Iterating over a Doc visits its tokens in order; .text is the token's string.
for token in doc:
    print(token.text)

Tesla
is
looking
at
buying
U.S.
startup
for
$
6
million


In [8]:
# One row per token: text, part-of-speech tag (pos_), syntactic dependency label (dep_).
# sep=" |  " places a pipe divider between the three columns.
for token in doc:
    print(token.text, token.pos_, token.dep_, sep=" |  ")

Tesla |  PROPN |  nsubj
is |  VERB |  aux
looking |  VERB |  ROOT
at |  ADP |  prep
buying |  VERB |  pcomp
U.S. |  PROPN |  compound
startup |  NOUN |  dobj
for |  ADP |  prep
$ |  SYM |  quantmod
6 |  NUM |  compound
million |  NUM |  pobj


In [9]:
# Show the components of the loaded pipeline as (name, component) pairs.
nlp.pipeline

[('tagger', <spacy.pipeline.Tagger at 0x1f05326ea08>),
 ('parser', <spacy.pipeline.DependencyParser at 0x1f05325fa08>),
 ('ner', <spacy.pipeline.EntityRecognizer at 0x1f05325ffa8>)]

In [10]:
# Show only the names of the pipeline components.
nlp.pipe_names

['tagger', 'parser', 'ner']

In [11]:
# Second sample: includes a contraction ("isn't") and a trailing period.
# (No u"" prefix needed: str literals are already Unicode in Python 3.)
doc2 = nlp("Tesla isn't looking into startups anymore.")

In [12]:
# One row per token: text, part-of-speech tag (pos_), syntactic dependency label (dep_).
# sep=" |  " places a pipe divider between the three columns.
for token in doc2:
    print(token.text, token.pos_, token.dep_, sep=" |  ")

Tesla |  PROPN |  nsubj
is |  VERB |  aux
n't |  ADV |  neg
looking |  VERB |  ROOT
into |  ADP |  prep
startups |  NOUN |  pobj
anymore |  ADV |  advmod
. |  PUNCT |  punct


In [13]:
# Integer indexing on a Doc returns a single token; index 0 is the first one.
doc2[0]

Tesla

In [14]:
# Part-of-speech tag of the first token, as a string.
doc2[0].pos_

'PROPN'

#### Span

In [15]:
# A longer passage to slice into. Adjacent string literals are concatenated by
# the parser, so the text handed to nlp() is a single line.
# NOTE(review): "commmonly" is a typo in the sample text; kept verbatim so the
# input string is unchanged.
doc3 = nlp(
    'Although commmonly attributed to John Lennon from his song "Beautiful Boy", '
    'the phrase "Life is what happens to us while we are making other plans" was written by '
    "cartoonist Allen Saunders and published in Reader's Digest in 1957, when Lennon was 17."
)

In [16]:
# Slice bounds are token offsets, not character offsets: tokens 16..29 cover
# the quoted phrase together with its opening and closing quote marks.
quote_start, quote_end = 16, 30
life_quote = doc3[quote_start:quote_end]
print(life_quote)

"Life is what happens to us while we are making other plans"


In [17]:
# Slicing a Doc produces a Span rather than a new Doc.
type(life_quote)

spacy.tokens.span.Span

In [18]:
# The object returned by nlp(...) is a Doc.
type(doc3)

spacy.tokens.doc.Doc

In [19]:
# Three short sentences for the sentence-segmentation demo; the last one has no
# closing period. (No u"" prefix needed: str literals are Unicode in Python 3.)
doc4 = nlp("This is the first sentence. This is another sentence. This is the last sentence")

In [20]:
# doc4.sents yields the sentences detected in the Doc, one at a time.
for sentence in doc4.sents:
    print(sentence)

This is the first sentence.
This is another sentence.
This is the last sentence


In [21]:
# Token at index 6: the "This" that opens the second sentence.
doc4[6]

This

In [22]:
# is_sent_start reports whether this token begins a sentence.
doc4[6].is_sent_start

True