In [1]:
import spacy

In [2]:
# Load the small English pipeline once; every later cell reuses this `nlp` object.
nlp = spacy.load('en_core_web_sm')

In [10]:
# List the names of the components in the loaded pipeline, in order.
nlp.pipe_names

['tok2vec', 'tagger', 'parser', 'attribute_ruler', 'lemmatizer', 'ner']

In [9]:
doc = nlp("Elon flew to Mars yesterday. He carried biryani masala with him")

# One row per token: text, coarse POS label, its integer id, and a readable description.
for tok in doc:
    print(tok, tok.pos_, tok.pos, spacy.explain(tok.pos_), sep=" | ")

Elon | PROPN | 96 | proper noun
flew | VERB | 100 | verb
to | ADP | 85 | adposition
Mars | PROPN | 96 | proper noun
yesterday | NOUN | 92 | noun
. | PUNCT | 97 | punctuation
He | PRON | 95 | pronoun
carried | VERB | 100 | verb
biryani | ADJ | 84 | adjective
masala | NOUN | 92 | noun
with | ADP | 85 | adposition
him | PRON | 95 | pronoun


In [14]:
doc = nlp("Wow! Dr. Strange made 265 million $ on the very first day")

# For each token show the coarse tag (pos_), its integer id, and the fine-grained
# tag (tag_); each label is followed by the description from spacy.explain().
for tok in doc:
    fields = (
        tok,
        tok.pos_,
        tok.pos,
        spacy.explain(tok.pos_),
        tok.tag_,
        spacy.explain(tok.tag_),
    )
    print(*fields, sep=" | ")

Wow | INTJ | 91 | interjection | UH | interjection
! | PUNCT | 97 | punctuation | . | punctuation mark, sentence closer
Dr. | PROPN | 96 | proper noun | NNP | noun, proper singular
Strange | PROPN | 96 | proper noun | NNP | noun, proper singular
made | VERB | 100 | verb | VBD | verb, past tense
265 | NUM | 93 | numeral | CD | cardinal number
million | NUM | 93 | numeral | CD | cardinal number
$ | NUM | 93 | numeral | CD | cardinal number
on | ADP | 85 | adposition | IN | conjunction, subordinating or preposition
the | DET | 90 | determiner | DT | determiner
very | ADV | 86 | adverb | RB | adverb
first | ADJ | 84 | adjective | JJ | adjective (English), other noun-modifier (Chinese)
day | NOUN | 92 | noun | NN | noun, singular or mass


### spaCy detects verb tense (via the fine-grained `tag_`)

In [15]:
doc = nlp("He quits the job")

# The verb is the second token; print its text, fine-grained tag, and the tag's description.
verb = doc[1]
print(verb.text, verb.tag_, spacy.explain(verb.tag_), sep=" | ")

quits | VBZ | verb, 3rd person singular present


In [16]:
doc = nlp("He quit the job")

# Same sentence without the trailing "s": compare the fine-grained tag of the verb.
verb = doc[1]
print(verb.text, verb.tag_, spacy.explain(verb.tag_), sep=" | ")

quit | VBD | verb, past tense


In [28]:
text = "Microsoft Corporation is an American X multinational technology corporation headquartered in Redmond, Washington. It is also incorporated in Washington. Microsoft's best-known software products are the Windows line of operating systems, the Microsoft 365 suite of productivity applications, and the Edge web browser"

doc = nlp(text)

# Gather every token whose coarse POS tag is one of SPACE, X or PUNCT.
# NOTE(review): despite its name, this list holds the tokens that MATCH those
# tags, not the ones left after removing them — confirm that is the intent.
filetered_tokens = [token for token in doc if token.pos_ in ("SPACE", "X", "PUNCT")]

# Print the coarse POS tag and its description for every token in the text.
for token in doc:
    print(token, token.pos_, spacy.explain(token.pos_), sep=" | ")

Microsoft | PROPN | proper noun
Corporation | PROPN | proper noun
is | AUX | auxiliary
an | DET | determiner
American | PROPN | proper noun
X | PROPN | proper noun
multinational | ADJ | adjective
technology | NOUN | noun
corporation | NOUN | noun
headquartered | VERB | verb
in | ADP | adposition
Redmond | PROPN | proper noun
, | PUNCT | punctuation
Washington | PROPN | proper noun
. | PUNCT | punctuation
It | PRON | pronoun
is | AUX | auxiliary
also | ADV | adverb
incorporated | VERB | verb
in | ADP | adposition
Washington | PROPN | proper noun
. | PUNCT | punctuation
Microsoft | PROPN | proper noun
's | PART | particle
best | ADV | adverb
- | PUNCT | punctuation
known | VERB | verb
software | NOUN | noun
products | NOUN | noun
are | AUX | auxiliary
the | DET | determiner
Windows | PROPN | proper noun
line | NOUN | noun
of | ADP | adposition
operating | NOUN | noun
systems | NOUN | noun
, | PUNCT | punctuation
the | DET | determiner
Microsoft | PROPN | proper noun
365 | NUM | numeral
s

In [29]:
# Display the tokens collected above (those tagged SPACE, X or PUNCT).
filetered_tokens

[,, ., ., -, ,, ,]

In [33]:
# Tally tokens per coarse POS tag; the resulting dict is keyed by integer POS ids.
count = doc.count_by(spacy.attrs.POS)
count

{96: 11,
 87: 3,
 90: 4,
 84: 1,
 92: 12,
 100: 3,
 85: 4,
 97: 6,
 95: 1,
 86: 2,
 94: 1,
 93: 1,
 89: 1}

In [34]:
# Translate each integer POS id back to its label through the vocab before printing.
for pos_id, freq in count.items():
    print(doc.vocab[pos_id].text, freq, sep=" | ")


PROPN | 11
AUX | 3
DET | 4
ADJ | 1
NOUN | 12
VERB | 3
ADP | 4
PUNCT | 6
PRON | 1
ADV | 2
PART | 1
NUM | 1
CCONJ | 1
