In [1]:
import spacy 

In [4]:
# Load spaCy's `en_core_web_md` English pipeline.
nlp = spacy.load('en_core_web_md')

# Sample passage. The continuation lines keep their leading indentation, so
# the parsed document contains newline-plus-spaces whitespace tokens.
text = '''Special sequences make commonly used patterns easier to write. Here's a list of special sequences.
        The above code defines a RegEx pattern. The pattern is: any five letter string starting with a and ending with s.
        There are other several functions defined in the re module to work with RegEx. 
        Before we explore that, let's learn about regular expressions themselves. unnoticed'''

# Run the pipeline once; the cells below read their annotations from `doc`.
doc = nlp(text)

# Pair every token's surface text with its lemma.
lemma = [(tok.text, tok.lemma_) for tok in doc]

In [5]:
# Show the (token text, lemma) pairs collected in the previous cell.
lemma

[('Special', 'special'),
 ('sequences', 'sequence'),
 ('make', 'make'),
 ('commonly', 'commonly'),
 ('used', 'use'),
 ('patterns', 'pattern'),
 ('easier', 'easy'),
 ('to', 'to'),
 ('write', 'write'),
 ('.', '.'),
 ('Here', 'here'),
 ("'s", 'be'),
 ('a', 'a'),
 ('list', 'list'),
 ('of', 'of'),
 ('special', 'special'),
 ('sequences', 'sequence'),
 ('.', '.'),
 ('\n        ', '\n        '),
 ('The', 'the'),
 ('above', 'above'),
 ('code', 'code'),
 ('defines', 'define'),
 ('a', 'a'),
 ('RegEx', 'RegEx'),
 ('pattern', 'pattern'),
 ('.', '.'),
 ('The', 'the'),
 ('pattern', 'pattern'),
 ('is', 'be'),
 (':', ':'),
 ('any', 'any'),
 ('five', 'five'),
 ('letter', 'letter'),
 ('string', 'string'),
 ('starting', 'start'),
 ('with', 'with'),
 ('a', 'a'),
 ('and', 'and'),
 ('ending', 'end'),
 ('with', 'with'),
 ('s.', 's.'),
 ('\n        ', '\n        '),
 ('There', 'there'),
 ('are', 'be'),
 ('other', 'other'),
 ('several', 'several'),
 ('functions', 'function'),
 ('defined', 'define'),
 ('in', 'in

##### Part-of-Speech (POS) Tagging

In [17]:
# For each token: surface text, part-of-speech tag, and spaCy's
# human-readable description of that tag.
pos = [
    (tok.text, tok.pos_, spacy.explain(tok.pos_))
    for tok in doc
]

In [18]:
# Show the (token text, POS tag, tag description) triples.
pos

[('Special', 'ADJ', 'adjective'),
 ('sequences', 'NOUN', 'noun'),
 ('make', 'VERB', 'verb'),
 ('commonly', 'ADV', 'adverb'),
 ('used', 'VERB', 'verb'),
 ('patterns', 'NOUN', 'noun'),
 ('easier', 'ADJ', 'adjective'),
 ('to', 'PART', 'particle'),
 ('write', 'VERB', 'verb'),
 ('.', 'PUNCT', 'punctuation'),
 ('Here', 'ADV', 'adverb'),
 ("'s", 'AUX', 'auxiliary'),
 ('a', 'DET', 'determiner'),
 ('list', 'NOUN', 'noun'),
 ('of', 'ADP', 'adposition'),
 ('special', 'ADJ', 'adjective'),
 ('sequences', 'NOUN', 'noun'),
 ('.', 'PUNCT', 'punctuation'),
 ('\n        ', 'SPACE', 'space'),
 ('The', 'DET', 'determiner'),
 ('above', 'ADJ', 'adjective'),
 ('code', 'NOUN', 'noun'),
 ('defines', 'VERB', 'verb'),
 ('a', 'DET', 'determiner'),
 ('RegEx', 'PROPN', 'proper noun'),
 ('pattern', 'NOUN', 'noun'),
 ('.', 'PUNCT', 'punctuation'),
 ('The', 'DET', 'determiner'),
 ('pattern', 'NOUN', 'noun'),
 ('is', 'AUX', 'auxiliary'),
 (':', 'PUNCT', 'punctuation'),
 ('any', 'DET', 'determiner'),
 ('five', 'NUM', 'n

##### Named Entity Recognition (NER)

In [19]:
# One tuple per named entity in the document: its text, start and end
# character offsets, and entity label.
[
    (entity.text, entity.start_char, entity.end_char, entity.label_)
    for entity in doc.ents
]

[('five', 167, 171, 'CARDINAL')]

In [20]:
# Materialise the sentence spans of `doc` into a list so they can be
# displayed and iterated over again in the following cells.
sentences = list(doc.sents)

In [21]:
# Show the sentence spans produced by the sentence segmenter.
sentences

[Special sequences make commonly used patterns easier to write.,
 Here's a list of special sequences.
         ,
 The above code defines a RegEx pattern.,
 The pattern is: any five letter string starting with a and ending with s.
         There are other several functions defined in the re module to work with RegEx. 
         ,
 Before we explore that, let's learn about regular expressions themselves.]

In [22]:
# Print the named entities found in each sentence, one list per sentence.
# The start/end values are the same character offsets that the
# document-level entity listing reports.
for sent in sentences:
    print([
        (entity.text, entity.start_char, entity.end_char, entity.label_)
        for entity in sent.ents
    ])

[]
[]
[]
[('five', 167, 171, 'CARDINAL')]
[]


In [23]:
# Token-level view of the entities: `ent_type_` is the empty string for
# tokens that are not part of any entity.
print([(tok.text, tok.ent_type_) for tok in doc])

[('Special', ''), ('sequences', ''), ('make', ''), ('commonly', ''), ('used', ''), ('patterns', ''), ('easier', ''), ('to', ''), ('write', ''), ('.', ''), ('Here', ''), ("'s", ''), ('a', ''), ('list', ''), ('of', ''), ('special', ''), ('sequences', ''), ('.', ''), ('\n        ', ''), ('The', ''), ('above', ''), ('code', ''), ('defines', ''), ('a', ''), ('RegEx', ''), ('pattern', ''), ('.', ''), ('The', ''), ('pattern', ''), ('is', ''), (':', ''), ('any', ''), ('five', 'CARDINAL'), ('letter', ''), ('string', ''), ('starting', ''), ('with', ''), ('a', ''), ('and', ''), ('ending', ''), ('with', ''), ('s.', ''), ('\n        ', ''), ('There', ''), ('are', ''), ('other', ''), ('several', ''), ('functions', ''), ('defined', ''), ('in', ''), ('the', ''), ('re', ''), ('module', ''), ('to', ''), ('work', ''), ('with', ''), ('RegEx', ''), ('.', ''), ('\n        ', ''), ('Before', ''), ('we', ''), ('explore', ''), ('that', ''), (',', ''), ('let', ''), ("'s", ''), ('learn', ''), ('about', ''), ('re

In [24]:
# The word "watch" appears twice: once used as a verb, once as a noun.
# NOTE(review): 'everday' looks like a typo for 'every day'; it is kept as-is
# because the recorded output was produced from this exact string.
text1 = "I watch movie. I wear a watch everday"

# NOTE(review): this rebinds `doc`; re-running earlier cells after this one
# would make them operate on this short text instead of the original passage.
doc = nlp(text1)

# Text, POS tag, and tag description for every token.
print([(tok.text, tok.pos_, spacy.explain(tok.pos_)) for tok in doc])

[('I', 'PRON', 'pronoun'), ('watch', 'VERB', 'verb'), ('movie', 'NOUN', 'noun'), ('.', 'PUNCT', 'punctuation'), ('I', 'PRON', 'pronoun'), ('wear', 'VERB', 'verb'), ('a', 'DET', 'determiner'), ('watch', 'NOUN', 'noun'), ('everday', 'NOUN', 'noun')]
