In [1]:
import spacy

In [2]:
# Load the en_core_web_sm pipeline once; the later cells call this `nlp` object.
nlp = spacy.load('en_core_web_sm')

In [3]:
# Run a sample sentence through the pipeline to get a processed Doc.
sample_text = 'Tesla is looking at U.S.S.R for buying $6 million worth of cost'
doc = nlp(sample_text)

In [4]:
# Print one row per token: text, numeric POS id, POS label, dependency label.
# The POS id is an integer that may be two or three digits wide (96 vs. 100),
# so it is right-aligned in a 3-character field to keep the columns straight;
# the previous width of 1 never padded anything.
for token in doc:
    print(f'{token.text:20} {token.pos:>3} {token.pos_:15}  {token.dep_}')

Tesla                96 PROPN            nsubj
is                   87 AUX              aux
looking              100 VERB             ROOT
at                   85 ADP              prep
U.S.S.R              96 PROPN            pobj
for                  85 ADP              prep
buying               100 VERB             pcomp
$                    99 SYM              quantmod
6                    93 NUM              compound
million              93 NUM              nummod
worth                92 NOUN             dobj
of                   85 ADP              prep
cost                 92 NOUN             pobj


In [5]:
# Inspect the loaded pipeline as a list of (name, component) pairs.
nlp.pipeline

[('tok2vec', <spacy.pipeline.tok2vec.Tok2Vec at 0x2329f288450>),
 ('tagger', <spacy.pipeline.tagger.Tagger at 0x2329f2def90>),
 ('parser', <spacy.pipeline.dep_parser.DependencyParser at 0x2329f2da160>),
 ('ner', <spacy.pipeline.ner.EntityRecognizer at 0x2329f0e5ac0>),
 ('attribute_ruler',
  <spacy.pipeline.attributeruler.AttributeRuler at 0x2329f2813c0>),
 ('lemmatizer', <spacy.lang.en.lemmatizer.EnglishLemmatizer at 0x2329f2740c0>)]

In [6]:
# Names of the components in the loaded pipeline.
nlp.pipe_names

['tok2vec', 'tagger', 'parser', 'ner', 'attribute_ruler', 'lemmatizer']

In [7]:
# The run of spaces after "kishmish" is kept as-is: it shows up as its own
# SPACE token when the tokens are listed.
spaced_text = "I got kishmish      from my mom but my sister didn't."
doc2 = nlp(spaced_text)

In [8]:
# One row per token: text, POS label, dependency label, in fixed-width columns.
for token in doc2:
    row = f'{token.text:20} {token.pos_:15}  {token.dep_}'
    print(row)

I                    PRON             nsubj
got                  VERB             ROOT
kishmish             ADJ              amod
                     SPACE            dobj
from                 ADP              prep
my                   PRON             poss
mom                  NOUN             pobj
but                  CCONJ            cc
my                   PRON             poss
sister               NOUN             nsubj
did                  VERB             conj
n't                  PART             neg
.                    PUNCT            punct


In [9]:
# A longer multi-sentence passage to slice into spans.
# The stray footnote marker "6" that had been pasted in after "Venus." is
# removed so it is not fed to the pipeline as a real token; all tokens up to
# and including "Venus." are unchanged, so existing token indices into the
# first sentence still point at the same words.
doc3 = nlp(
    'Gaius Julius Caesar was born into a patrician family, the gens Julia, '
    'which claimed descent from Julus, son of the legendary Trojan prince '
    'Aeneas, supposedly the son of the goddess Venus. '
    'The Julii were of Alban origin, mentioned as one of the leading Alban '
    'houses, which settled in Rome around the mid-7th century BC, following '
    'the destruction of Alba Longa. '
    'They were granted patrician status, along with other noble Alban '
    'families.'
)

In [10]:
# Take tokens 17 through 33 of doc3 (end index is exclusive) and show the text.
span_bounds = slice(17, 34)
julius = doc3[span_bounds]
print(julius)

from Julus, son of the legendary Trojan prince Aeneas, supposedly the son of the goddess


In [11]:
# A slice of a Doc is a Span object.
type(julius)

spacy.tokens.span.Span

In [12]:
# The object returned by nlp(...) is a Doc.
type(doc3)

spacy.tokens.doc.Doc

In [13]:
# Three short sentences, used to look at sentence segmentation.
doc4 = nlp(
    "This is the first sentence. "
    "This is another sentence. "
    "This is last statement."
)

In [14]:
# Walk the sentence spans found in doc4 and print each on its own line.
for sent_span in doc4.sents:
    print(sent_span)

This is the first sentence.
This is another sentence.
This is last statement.


In [15]:
# Token 6 is the "This" that opens the second sentence.
doc4[6].is_sent_start

True

In [16]:
# Token 8 ("another") sits in the middle of the second sentence.
doc4[8].is_sent_start

False