In [23]:
# Parts of Speech Tagging

# CC - Coordinating Conjunction
# CD - Cardinal Number
# DT - Determiner
# EX - Existential There
# FW - Foreign Word
# IN - Preposition or subordinating conjunction
# JJ - Adjective
# JJR - Adjective, Comparative  
# JJS - Adjective, Superlative
# LS - List Item Marker
# MD - Modal
# NN - Noun, Singular or Mass
# NNS - Noun, Plural
# NNP - Proper Noun, Singular
# NNPS - Proper Noun, Plural
# PDT - Predeterminer
# POS - Possessive Ending
# PRP - Personal Pronoun
# PRP$ - Possessive Pronoun
# RB - Adverb
# RBR - Adverb, Comparative
# RBS - Adverb, Superlative
# RP - Particle
# SYM - Symbol
# TO - to
# UH - Interjection
# VB - Verb, Base Form
# VBD - Verb, Past Tense
# VBG - Verb, Gerund or Present Participle
# VBN - Verb, Past Participle
# VBP - Verb, Non-3rd Person Singular Present
# VBZ - Verb, 3rd Person Singular Present
# WDT - Wh-Determiner
# WP - Wh-Pronoun
# WRB - Wh-Adverb




In [24]:
str = "Taj Mahal is a beautiful place"

paragraph = """My dear brothers and sisters,
I stand here before you today with a heart full of gratitude and a deep sense of humility. As the President of this great nation, I have been privileged to witness the remarkable progress and transformation that India has undergone in recent years. But this progress, my friends, is not the work of one person or one government. It is the result of the collective efforts and aspirations of over a billion Indians, each of whom has contributed in their own way to the growth and development of our beloved country.
When I look around, I see a nation brimming with energy, optimism, and a renewed sense of purpose. Our economy is growing at a rapid pace, lifting millions out of poverty and ushering in a new era of prosperity. Our scientific and technological achievements are the envy of the world, as we push the boundaries of human knowledge and innovation. And our rich cultural heritage, embodied in our languages, arts, and traditions, continues to inspire and captivate people across the globe.
But my friends, as we celebrate our successes, we must also acknowledge the challenges that lie ahead. Poverty, illiteracy, and inequality are still prevalent in many parts of our country. Our environment is under threat, and we must act quickly to preserve the delicate balance of our ecosystems. And with the advent of new technologies and global interconnectedness, we face the daunting task of ensuring that the benefits of progress are shared equitably among all our citizens.
Yet, I remain confident that we, the people of India, have the resilience, the ingenuity, and the determination to overcome these obstacles. For we have done it before, time and time again. We have stood united in the face of adversity, drawing strength from our diversity and our shared vision of a better future.
My fellow citizens, I believe that the time has come for us to dream big, to set our sights on lofty goals, and to work tirelessly towards their realization. Let us not be content with the status quo, but rather strive to create a India that is a beacon of hope and inspiration for the rest of the world.
Together, let us build a nation where every child has access to quality education and healthcare, where every family has a roof over their head and food on the table, where every individual is empowered to reach their full potential. Let us create a society that is just, equitable, and inclusive, where the fruits of our collective labor are shared equally among all.
And as we embark on this journey, let us remember the timeless words of our great leader, Mahatma Gandhi, who said, "Be the change you wish to see in the world." Each and every one of us has a role to play, a responsibility to fulfill, in shaping the future of our nation.
My friends, the path ahead may not be easy, but it is one that is filled with hope and promise. Let us face it with courage, determination, and a unwavering commitment to the ideals that have always defined us as a people – the ideals of unity, of compassion, and of service to our fellow citizens.
In closing, I would like to leave you with a quote that has always inspired me, from the ancient Indian text, the Bhagavad Gita: "Yoga is the journey of the self, through the self, to the self." May we all embark on this journey, and may the light of our collective wisdom and determination guide us towards a future that is brighter and more prosperous for all.
Thank you, and may God bless you all.
"""

In [31]:
import nltk
nltk.download('punkt')
nltk.download('stopwords')
nltk.download('averaged_perceptron_tagger_eng')
from nltk.tokenize import PunktSentenceTokenizer, WordPunctTokenizer
from nltk import pos_tag
from nltk.tokenize import word_tokenize

[nltk_data] Downloading package punkt to
[nltk_data]     /Users/saumyagupta/nltk_data...
[nltk_data]   Package punkt is already up-to-date!
[nltk_data] Downloading package stopwords to
[nltk_data]     /Users/saumyagupta/nltk_data...
[nltk_data]   Package stopwords is already up-to-date!
[nltk_data] Downloading package averaged_perceptron_tagger_eng to
[nltk_data]     /Users/saumyagupta/nltk_data...
[nltk_data]   Unzipping taggers/averaged_perceptron_tagger_eng.zip.


In [32]:
tokenizer = PunktSentenceTokenizer(paragraph)
sentences = tokenizer.tokenize(paragraph)
sentences

['My dear brothers and sisters,\nI stand here before you today with a heart full of gratitude and a deep sense of humility.',
 'As the President of this great nation, I have been privileged to witness the remarkable progress and transformation that India has undergone in recent years.',
 'But this progress, my friends, is not the work of one person or one government.',
 'It is the result of the collective efforts and aspirations of over a billion Indians, each of whom has contributed in their own way to the growth and development of our beloved country.',
 'When I look around, I see a nation brimming with energy, optimism, and a renewed sense of purpose.',
 'Our economy is growing at a rapid pace, lifting millions out of poverty and ushering in a new era of prosperity.',
 'Our scientific and technological achievements are the envy of the world, as we push the boundaries of human knowledge and innovation.',
 'And our rich cultural heritage, embodied in our languages, arts, and tradition

In [33]:
#Find out parts of speech of words in each sentence
from nltk.corpus import stopwords
stop_words = set(stopwords.words('english'))
for i in range(len(sentences)):
    words = WordPunctTokenizer().tokenize(sentences[i])
    words = [word for word in words if word not in stop_words]
    tags = pos_tag(words)
    print(tags)

[('My', 'PRP$'), ('dear', 'JJ'), ('brothers', 'NNS'), ('sisters', 'NNS'), (',', ','), ('I', 'PRP'), ('stand', 'VBP'), ('today', 'NN'), ('heart', 'NN'), ('full', 'JJ'), ('gratitude', 'NN'), ('deep', 'JJ'), ('sense', 'NN'), ('humility', 'NN'), ('.', '.')]
[('As', 'IN'), ('President', 'NNP'), ('great', 'JJ'), ('nation', 'NN'), (',', ','), ('I', 'PRP'), ('privileged', 'VBD'), ('witness', 'RBR'), ('remarkable', 'JJ'), ('progress', 'NN'), ('transformation', 'NN'), ('India', 'NNP'), ('undergone', 'JJ'), ('recent', 'JJ'), ('years', 'NNS'), ('.', '.')]
[('But', 'CC'), ('progress', 'NN'), (',', ','), ('friends', 'NNS'), (',', ','), ('work', 'VBP'), ('one', 'CD'), ('person', 'NN'), ('one', 'CD'), ('government', 'NN'), ('.', '.')]
[('It', 'PRP'), ('result', 'VBZ'), ('collective', 'JJ'), ('efforts', 'NNS'), ('aspirations', 'NNS'), ('billion', 'CD'), ('Indians', 'NNPS'), (',', ','), ('contributed', 'VBD'), ('way', 'NN'), ('growth', 'NN'), ('development', 'NN'), ('beloved', 'VBD'), ('country', 'NN'),

In [35]:
pos_tag(str.split())

[('Taj', 'NNP'),
 ('Mahal', 'NNP'),
 ('is', 'VBZ'),
 ('a', 'DT'),
 ('beautiful', 'JJ'),
 ('place', 'NN')]