In [2]:
import spacy

In [3]:
# Load the small English spaCy pipeline package; `nlp` is the callable
# pipeline object that later cells apply to raw text.
nlp = spacy.load('en_core_web_sm')

In [4]:
# Sample sentence to analyse; it mixes a proper noun, an abbreviation with
# periods ("U.S.") and a currency amount ("$1 trillion").
text = "Apple is the first U.S. public company reaching a $1 trillion market value."

In [5]:
# Run the loaded pipeline over the sample sentence; the result is kept in
# `doc` and inspected by the cells that follow.
doc = nlp(text)

In [6]:
# Displaying the processed object shows the original sentence text.
doc

Apple is the first U.S. public company reaching a $1 trillion market value.

In [7]:
# Check what kind of object the pipeline returned (a spaCy Doc).
type(doc)

spacy.tokens.doc.Doc

In [8]:
# Iterating over the Doc yields its tokens in order; print one per line to
# see how the sentence was split (e.g. "$" and "1" become separate tokens).
for token in doc:
    print(token)

Apple
is
the
first
U.S.
public
company
reaching
a
$
1
trillion
market
value
.


In [9]:
# Index into the Doc to get a single token; `.text` is its string form.
doc[0].text

'Apple'

In [10]:
# Part-of-speech (POS) tag of the first token, as a string label.
# Use spacy.explain(label) to get a plain-English description of the label.
doc[0].pos_

'PROPN'

In [11]:
# Syntactic dependency label of the first token, as a string
# (here 'nsubj', i.e. the token acts as a nominal subject).
doc[0].dep_

'nsubj'

In [12]:
# Lemma (base form) of the first token, as a string.
doc[0].lemma_

'Apple'

In [18]:
 for token in doc:
     # Get the token text, part-of-speech tag and dependency label
    token_text = token.text
    token_pos= token.pos_
    token_dep = token.dep_
    token_lemma = token.lemma_
    # This is for formatting only
    print(f"{token_text:<12}{token_pos:<10}{token_dep:<10}{token_lemma:<10}")  

Apple       PROPN     nsubj     Apple     
is          AUX       ROOT      be        
the         DET       det       the       
first       ADJ       amod      first     
U.S.        PROPN     nmod      U.S.      
public      ADJ       amod      public    
company     NOUN      attr      company   
reaching    VERB      acl       reach     
a           DET       det       a         
$           SYM       quantmod  $         
1           NUM       compound  1         
trillion    NUM       nummod    trillion  
market      NOUN      compound  market    
value       NOUN      dobj      value     
.           PUNCT     punct     .         


In [56]:
# Show the pipeline's components as (name, component) pairs.
# NOTE(review): the reprs include memory addresses that change on every run;
# `nlp.pipe_names` would presumably give just the names — confirm before switching.
nlp.pipeline

[('tok2vec', <spacy.pipeline.tok2vec.Tok2Vec at 0x1ea0939f270>),
 ('tagger', <spacy.pipeline.tagger.Tagger at 0x1ea09495a40>),
 ('parser', <spacy.pipeline.dep_parser.DependencyParser at 0x1ea08f60b20>),
 ('attribute_ruler',
  <spacy.pipeline.attributeruler.AttributeRuler at 0x1ea08f8c7c0>),
 ('lemmatizer', <spacy.lang.en.lemmatizer.EnglishLemmatizer at 0x1ea0901b140>),
 ('ner', <spacy.pipeline.ner.EntityRecognizer at 0x1ea08f60940>)]

In [57]:
# Second example: a sentence containing a contraction ("isn't"), processed
# with the same pipeline.
doc2 = nlp("Google isn't looking into startups.")

In [59]:
# Tabulate text, part-of-speech tag and dependency label for the second
# sentence, using fixed-width left-aligned columns.
for token in doc2:
    row = f"{token.text:<12}{token.pos_:<10}{token.dep_:<10}"
    print(row)

Google      PROPN     nsubj     
is          AUX       aux       
n't         PART      neg       
looking     VERB      ROOT      
into        ADP       prep      
startups    NOUN      pobj      
.           PUNCT     punct     


In [60]:
# Look up the plain-English description of the 'PROPN' label seen above.
spacy.explain('PROPN')

'proper noun'

In [61]:
# Look up the plain-English description of the 'AUX' label seen above.
spacy.explain('AUX')

'auxiliary'