In [49]:
paragraph="""Blockchain technology has emerged as a revolutionary force in the realm of digital transactions and financial systems, offering a decentralized and secure method for transferring value and verifying transactions. This essay delves into the intricacies of blockchain technology, exploring its workings, implications, and potential future developments.Understanding Blockchain Technology:  At its core, blockchain technology operates as a distributed ledger, a database that records transactions across multiple computers in a network. Each transaction is recorded in a block, and once added to the chain, it becomes immutable. This structure ensures transparency, security, and decentralization, as no single entity controls the entire network. Cryptocurrencies like Bitcoin are built upon this technology, leveraging it to enable peer-to-peer transactions without the need for intermediaries such as banks or governments 3.
The Double-Spend Problem and Its Solution: A significant challenge in digital currencies is the double-spend problem, where a digital unit of currency can be duplicated and spent more than once. Traditional solutions involve a trusted third party to verify transactions, but blockchain technology solves this problem through a consensus mechanism among network participants. Miners, who validate transactions, are rewarded with cryptocurrency, creating a self-regulating ecosystem that prevents fraudulent activities """

In [50]:
from nltk.stem import PorterStemmer

In [51]:
from nltk.corpus import stopwords

In [52]:
import nltk
nltk.download('stopwords')

[nltk_data] Downloading package stopwords to
[nltk_data]     /Users/udaykiran/nltk_data...
[nltk_data]   Package stopwords is already up-to-date!


True

In [53]:
stopwords.words('english')

['i',
 'me',
 'my',
 'myself',
 'we',
 'our',
 'ours',
 'ourselves',
 'you',
 "you're",
 "you've",
 "you'll",
 "you'd",
 'your',
 'yours',
 'yourself',
 'yourselves',
 'he',
 'him',
 'his',
 'himself',
 'she',
 "she's",
 'her',
 'hers',
 'herself',
 'it',
 "it's",
 'its',
 'itself',
 'they',
 'them',
 'their',
 'theirs',
 'themselves',
 'what',
 'which',
 'who',
 'whom',
 'this',
 'that',
 "that'll",
 'these',
 'those',
 'am',
 'is',
 'are',
 'was',
 'were',
 'be',
 'been',
 'being',
 'have',
 'has',
 'had',
 'having',
 'do',
 'does',
 'did',
 'doing',
 'a',
 'an',
 'the',
 'and',
 'but',
 'if',
 'or',
 'because',
 'as',
 'until',
 'while',
 'of',
 'at',
 'by',
 'for',
 'with',
 'about',
 'against',
 'between',
 'into',
 'through',
 'during',
 'before',
 'after',
 'above',
 'below',
 'to',
 'from',
 'up',
 'down',
 'in',
 'out',
 'on',
 'off',
 'over',
 'under',
 'again',
 'further',
 'then',
 'once',
 'here',
 'there',
 'when',
 'where',
 'why',
 'how',
 'all',
 'any',
 'both',
 'each

In [54]:
stopwords.words('french')

['au',
 'aux',
 'avec',
 'ce',
 'ces',
 'dans',
 'de',
 'des',
 'du',
 'elle',
 'en',
 'et',
 'eux',
 'il',
 'ils',
 'je',
 'la',
 'le',
 'les',
 'leur',
 'lui',
 'ma',
 'mais',
 'me',
 'même',
 'mes',
 'moi',
 'mon',
 'ne',
 'nos',
 'notre',
 'nous',
 'on',
 'ou',
 'par',
 'pas',
 'pour',
 'qu',
 'que',
 'qui',
 'sa',
 'se',
 'ses',
 'son',
 'sur',
 'ta',
 'te',
 'tes',
 'toi',
 'ton',
 'tu',
 'un',
 'une',
 'vos',
 'votre',
 'vous',
 'c',
 'd',
 'j',
 'l',
 'à',
 'm',
 'n',
 's',
 't',
 'y',
 'été',
 'étée',
 'étées',
 'étés',
 'étant',
 'étante',
 'étants',
 'étantes',
 'suis',
 'es',
 'est',
 'sommes',
 'êtes',
 'sont',
 'serai',
 'seras',
 'sera',
 'serons',
 'serez',
 'seront',
 'serais',
 'serait',
 'serions',
 'seriez',
 'seraient',
 'étais',
 'était',
 'étions',
 'étiez',
 'étaient',
 'fus',
 'fut',
 'fûmes',
 'fûtes',
 'furent',
 'sois',
 'soit',
 'soyons',
 'soyez',
 'soient',
 'fusse',
 'fusses',
 'fût',
 'fussions',
 'fussiez',
 'fussent',
 'ayant',
 'ayante',
 'ayantes',


In [55]:
from nltk.stem import PorterStemmer

In [56]:
stemmer=PorterStemmer()

In [75]:
sentences=nltk.sent_tokenize(paragraph) #take a paragraph divide into sentences

In [58]:
type(sentences)

list

In [59]:
print(sentences)

['Blockchain technology has emerged as a revolutionary force in the realm of digital transactions and financial systems, offering a decentralized and secure method for transferring value and verifying transactions.', 'This essay delves into the intricacies of blockchain technology, exploring its workings, implications, and potential future developments.Understanding Blockchain Technology:  At its core, blockchain technology operates as a distributed ledger, a database that records transactions across multiple computers in a network.', 'Each transaction is recorded in a block, and once added to the chain, it becomes immutable.', 'This structure ensures transparency, security, and decentralization, as no single entity controls the entire network.', 'Cryptocurrencies like Bitcoin are built upon this technology, leveraging it to enable peer-to-peer transactions without the need for intermediaries such as banks or governments 3.', 'The Double-Spend Problem and Its Solution: A significant ch

In [65]:
#Apply stopwords and filter and then apply stemming

for i in range(len(sentences)):
    words=nltk.word_tokenize(sentences[i])
    words=[stemmer.stem(word) for word in words if word not in set(stopwords.words('english'))]
    sentences[i]=''.join(words)#converting all the list of words into sentences 

In [66]:
sentences

['blockchaintechnologemergrevolutionariforcrealmdigittransactfinancisystem,offerdecentrsecurmethodtransfervaluverifitransact.',
 'thiessaydelvintricaciblockchaintechnolog,explorwork,implic,potentifuturdevelopments.understandblockchaintechnolog:atcor,blockchaintechnologoperdistributledg,databasrecordtransactacrossmultiplcomputnetwork.',
 'eachtransactrecordblock,adchain,becomimmut.',
 'thistructurensurtranspar,secur,decentr,singlentiticontrolentirnetwork.',
 'cryptocurrlikebitcoinbuiltupontechnolog,leveragenablpeer-to-ptransactwithoutneedintermediaribankgovern3.',
 'thedouble-spendproblemitsolut:asignificchallengdigitcurrencdouble-spendproblem,digitunitcurrencduplicsp.',
 'traditsolutinvolvtrustthirdpartiverifitransact,blockchaintechnologsolvproblemconsensumechanamongnetworkparticip.',
 'miner,validtransact,rewardcryptocurr,creatself-regulecosystempreventfraudulactiv']

In [67]:
from nltk.stem import SnowballStemmer
snowballstemmer=SnowballStemmer('english')

In [68]:
#Apply stopwords and filter and then apply snowball stemming

for i in range(len(sentences)):
    words=nltk.word_tokenize(sentences[i])
    words=[snowballstemmer.stem(word) for word in words if word not in set(stopwords.words('english'))]
    sentences[i]=''.join(words)#converting all the list of words into sentences 

In [69]:
sentences

['blockchaintechnologemergrevolutionariforcrealmdigittransactfinancisystem,offerdecentrsecurmethodtransfervaluverifitransact.',
 'thiessaydelvintricaciblockchaintechnolog,explorwork,implic,potentifuturdevelopments.understandblockchaintechnolog:atcor,blockchaintechnologoperdistributledg,databasrecordtransactacrossmultiplcomputnetwork.',
 'eachtransactrecordblock,adchain,becomimmut.',
 'thistructurensurtranspar,secur,decentr,singlentiticontrolentirnetwork.',
 'cryptocurrlikebitcoinbuiltupontechnolog,leveragenablpeer-to-ptransactwithoutneedintermediaribankgovern3.',
 'thedouble-spendproblemitsolut:asignificchallengdigitcurrencdouble-spendproblem,digitunitcurrencduplicsp.',
 'traditsolutinvolvtrustthirdpartiverifitransact,blockchaintechnologsolvproblemconsensumechanamongnetworkparticip.',
 'miner,validtransact,rewardcryptocurr,creatself-regulecosystempreventfraudulactiv']

In [73]:
from nltk.stem import WordNetLemmatizer
lemmatizer=WordNetLemmatizer()

In [79]:
#Apply stopwords and filter and then apply snowball stemming

for i in range(len(sentences)):
    words=nltk.word_tokenize(sentences[i])
    words=[lemmatizer.lemmatize(word,pos='v') for word in words if word not in set(stopwords.words('english'))]
    sentences[i]=''.join(words)#converting all the list of words into sentences 

In [80]:
sentences

['Blockchaintechnologyemergedrevolutionaryforcerealmdigitaltransactionfinancialsystem,offeringdecentralizedsecuremethodtransferringvalueverifyingtransaction.',
 'Thisessaydelfintricacyblockchaintechnology,exploringworking,implication,potentialfuturedevelopments.UnderstandingBlockchainTechnology:Atcore,blockchaintechnologyoperatesdistributedledger,databaserecordtransactionacrossmultiplecomputernetwork.',
 'Eachtransactionrecordedblock,addedchain,becomesimmutable.',
 'Thisstructureensurestransparency,security,decentralization,singleentitycontrolentirenetwork.',
 'CryptocurrencieslikeBitcoinbuiltupontechnology,leveragingenablepeer-to-peertransactionwithoutneedintermediarybankgovernment3.',
 'TheDouble-SpendProblemItsSolution:Asignificantchallengedigitalcurrencydouble-spendproblem,digitalunitcurrencyduplicatedspent.',
 'Traditionalsolutioninvolvetrustedthirdpartyverifytransaction,blockchaintechnologysolvesproblemconsensusmechanismamongnetworkparticipant.',
 'Miners,validatetransaction,rewa