In [1]:
from nltk.tokenize import word_tokenize
from nltk.tag import pos_tag

##  Parts of speech in the English language


There are eight parts of speech in the English language:

`noun, pronoun, verb,
adjective, adverb, preposition,
conjunction, and interjection`


https://www.grammarly.com/blog/parts-of-speech/?gclid=Cj0KCQjwxb2XBhDBARIsAOjDZ36Tsx7Pz7dqIG-DgN2KLbLlwC1bdJEXj6gTZCpErz0sL2scaH0r67caAjneEALw_wcB&gclsrc=aw.ds


In [2]:
true_labels = '''

I went to work         (work -- noun). 
I work in the garden   (work -- verb).

'''

test = '''

I went to work. 
I work in the garden.

'''

In [17]:
words = word_tokenize(test)
words

['I', 'went', 'to', 'work', '.', 'I', 'work', 'in', 'the', 'garden', '.']

In [18]:
pos_tag(words)

[('I', 'PRP'),
 ('went', 'VBD'),
 ('to', 'TO'),
 ('work', 'VB'),
 ('.', '.'),
 ('I', 'PRP'),
 ('work', 'VBP'),
 ('in', 'IN'),
 ('the', 'DT'),
 ('garden', 'NN'),
 ('.', '.')]

## POS tag list:
`
CC coordinating conjunction
CD cardinal digit
DT determiner
EX existential there (like: "there is" ... think of it like "there exists")
FW foreign word
IN preposition/subordinating conjunction
JJ adjective 'big'
JJR adjective, comparative 'bigger'
JJS adjective, superlative 'biggest'
LS list marker 1)
MD modal could, will
NN noun, singular 'desk'
NNS noun plural 'desks'
NNP proper noun, singular 'Harrison'
NNPS proper noun, plural 'Americans'
PDT predeterminer 'all the kids'
POS possessive ending parent's
PRP personal pronoun I, he, she
PRP$ possessive pronoun my, his, hers
RB adverb very, silently,
RBR adverb, comparative better
RBS adverb, superlative best
RP particle give up
TO to go 'to' the store.
UH interjection errrrrrrrm
VB verb, base form take
VBD verb, past tense took
VBG verb, gerund/present participle taking
VBN verb, past participle taken
VBP verb, sing. present, non-3d take
VBZ verb, 3rd person sing. present takes
WDT wh-determiner which
WP wh-pronoun who, what
WP$ possessive wh-pronoun whose
WRB wh-abverb where, when`

## Example 2

In [4]:
true_labels = '''

She paints very well              (well -- adverb).
He’s well-liked in his community  (well -- adjective).
I dropped a penny in the well     (well -- noun).

'''

test = '''

She paints very well.
He’s well-liked in his community.
I dropped a penny in the well.

'''

In [5]:
words = word_tokenize(test)
words

['She',
 'paints',
 'very',
 'well',
 '.',
 'He',
 '’',
 's',
 'well-liked',
 'in',
 'his',
 'community',
 '.',
 'I',
 'dropped',
 'a',
 'penny',
 'in',
 'the',
 'well',
 '.']

In [6]:
pos_tag(words)

[('She', 'PRP'),
 ('paints', 'VBZ'),
 ('very', 'RB'),
 ('well', 'RB'),
 ('.', '.'),
 ('He', 'PRP'),
 ('’', 'VBD'),
 ('s', 'JJ'),
 ('well-liked', 'JJ'),
 ('in', 'IN'),
 ('his', 'PRP$'),
 ('community', 'NN'),
 ('.', '.'),
 ('I', 'PRP'),
 ('dropped', 'VBD'),
 ('a', 'DT'),
 ('penny', 'NN'),
 ('in', 'IN'),
 ('the', 'DT'),
 ('well', 'NN'),
 ('.', '.')]

## Example 3

In [7]:
true_labels = '''

I cooked breakfast and lunch, but Steve cooked dinner   (but -- conjunction).
I brought everything but the pens you asked for         (but -- preposition).

'''

test = '''

I cooked breakfast and lunch, but Steve cooked dinner.
I brought everything but the pens you asked for.

'''

In [8]:
words = word_tokenize(test)
words

['I',
 'cooked',
 'breakfast',
 'and',
 'lunch',
 ',',
 'but',
 'Steve',
 'cooked',
 'dinner',
 '.',
 'I',
 'brought',
 'everything',
 'but',
 'the',
 'pens',
 'you',
 'asked',
 'for',
 '.']

In [9]:
pos_tag(words)

[('I', 'PRP'),
 ('cooked', 'VBD'),
 ('breakfast', 'NN'),
 ('and', 'CC'),
 ('lunch', 'NN'),
 (',', ','),
 ('but', 'CC'),
 ('Steve', 'NNP'),
 ('cooked', 'VBD'),
 ('dinner', 'NN'),
 ('.', '.'),
 ('I', 'PRP'),
 ('brought', 'VBD'),
 ('everything', 'NN'),
 ('but', 'CC'),
 ('the', 'DT'),
 ('pens', 'NNS'),
 ('you', 'PRP'),
 ('asked', 'VBD'),
 ('for', 'IN'),
 ('.', '.')]