# NLPAug

In [1]:
import nlpaug.augmenter.sentence as nas
import nlpaug.augmenter.word as naw

### ContextualWordEmbsAug

In [2]:
"""
    action = insert: a new word will be injected to random position according to contextual word embeddings calculation.
    action = substitute: word will be replaced according to contextual embeddings calculation
"""
aug = naw.ContextualWordEmbsAug(
model_path='bert-base-uncased', action="insert") 
aug = naw.ContextualWordEmbsAug(
    model_path='bert-base-uncased', action="substitute") 

text = 'The quick brown fox jumps over the lazy dog .'

augmented_text = aug.augment(text)
print("ORIGINAL TEXT: ", text)
print("AUGMENTED TEXT: ",augmented_text)

ORIGINAL TEXT:  The quick brown fox jumps over the lazy dog .
AUGMENTED TEXT:  the quick blue eye jumps over his lazy dog.


### Synonym Augmentation

In [3]:
# Sentence to perturb with synonyms.
text = 'The quick brown fox jumps over the lazy dog .'

# Synonym augmenter backed by WordNet, configured with aug_max=2.
syn_aug = naw.SynonymAug(
    aug_src='wordnet',
    aug_max=2,
)

# n=4 requests four augmented variants from a single call.
syn_aug_text = syn_aug.augment(text, n=4)

# Show the input followed by the generated variants.
for label, value in (
    ("ORIGINAL TEXT: ", text),
    ("AUGMENTED TEXT: ", syn_aug_text),
):
    print(label, value)


ORIGINAL TEXT:  The quick brown fox jumps over the lazy dog .
AUGMENTED TEXT:  ['The speedy brownness fox jumps over the lazy dog.', 'The quick brown fox bound over the lazy andiron.', 'The quick brown dodger jumps all over the lazy dog.', 'The quick brown fox jump terminated the lazy dog.']


### BackTranslation

In [4]:
# Sentence to paraphrase via back translation.
text = 'The quick brown fox jumps over the lazy dog .'

# Back-translation augmenter built with its default arguments.
aug = naw.BackTranslationAug()

print("ORIGINAL TEXT: ", text)

# Augment after echoing the input so the two lines appear in the same order
# as before, then show the result.
back_translated_text = aug.augment(text)
print("AUGMENTED TEXT: ", back_translated_text)

ORIGINAL TEXT:  The quick brown fox jumps over the lazy dog .
AUGMENTED TEXT:  The speedy brown fox jumps over the lazy dog.


### Abstractive Summary

In [5]:
import nltk

# Multi-paragraph news excerpt used as the summarization input.
paragraph = """ With the election fervour at its peak, a report by the Association for Democratic Reforms (ADR) revealed that assets of 78, that is, 77% of MLAs in the Punjab legislative assembly who are re-contesting in this year’s state elections, has seen a surge ranging from 2% to 2,954%. The average asset growth, based on the analysis of their poll affidavits, of these 101 MLAs between the 2017 and 2022 assembly elections is ₹2.76 crore.

According to the report, Sukhbir Singh Badal of Shiromani Akali Dal (SAD) from the Jalalabad constituency has declared the maximum increase in assets, by ₹100 crore. His assets increased from ₹102 crore in 2017 to ₹202 crore in 2022. He is followed by Manpreet Singh Badal of the Indian National Congress whose assets increased by ₹32 crore, from ₹40 crore in 2017 to ₹72 crore in 2022.

However, assets of 21 MLAs have dropped from -2% to -74% in the last five years. Among those are chief minister Charanjit Singh Channi, whose assets decreased from ₹14.51 crore in 2017 to ₹9.45 crore in 2022. Punjab Congress president Navjot Singh Sidhu, too, saw a slight decrease in assets, from ₹45.9 crore in 2017 to ₹44.65 crore this year.
"""

# Break the excerpt into individual sentences; the augmenter below receives
# this list rather than the raw paragraph.
sent_list = nltk.sent_tokenize(paragraph)

# Abstractive summarization augmenter built with its default arguments.
aug = nas.AbstSummAug()

# `pred` is reused by the following cell, so keep the name.
pred = aug.augment(sent_list)
print(pred)

['a report by the association for democratic reforms (ADR) revealed that assets of 78, that is, 77% of MLAs in the Punjab legislative assembly who are re-contesting in this year’s state elections, has seen a surge ranging from 2% to 2,954%.', 'the average asset growth of these 101 MLAs between the 2017 and 2022 assembly elections is 2.76 crore.', 'Sukhbir Singh Badal of the Shiromani Akali Dal (SAD) from the Jalalabad constituency declared the maximum increase in assets, by 100 crore.', 'assets increased from 102 crore in 2017 to 202 crore in 2022.', 'he is followed by Manpreet Singh Badal of the Indian National Congress. his assets increased by 32 crore, from 40 crore in 2017 to 72 crore in 2022.', 'assets of 21 MLAs have dropped from -2% to -74% in the last five years.', 'among them is chief minister Charanjit Singh Channi. his assets decreased from 14.51 crore in 2017 to 9.45 crore in 2022.', 'Navjot Singh Sidhu sees a slight decrease in assets, from 45.9 crore in 2017 to 44.65 cror

In [6]:
# Back-translate the summarized sentences held in `pred` (produced by the
# abstractive summary cell).
aug = naw.BackTranslationAug()
back_translated_pred = aug.augment(pred)
print("AUGMENTED TEXT: ", back_translated_pred)


AUGMENTED TEXT:  ["A report by the Association for Democratic Reform (ADR) found that the assets of 78, or 77% of the Punjab legislature's MLAs running again in this year's parliamentary elections, have risen between 2% and 2,954%.", 'The average wealth growth of these 101 MLAs between the 2017 and 2022 parliamentary elections is 2.76 crore.', 'Sukhbir Singh Badal of the Shiromani Akali Dal (SAD) from the Jalalabad constituency explained the maximum increase in assets by 100 crore.', 'Assets rose from 102 crore in 2017 to 202 crore in 2022.', 'He is succeeded by Manpreet Singh Badal of the Indian National Congress, whose wealth has increased by 32 crore, from 40 crore in 2017 to 72 crore in 2022.', 'The assets of 21 MLAs have fallen from -2% to -74% in the last five years.', 'Among them is Prime Minister Charanjit Singh Chan, whose wealth has fallen from $14.51 billion in 2017 to $9.45 billion in 2022.', 'Navjot Singh Sidhu sees a slight decline in assets, from 45.9 crore in 2017 to 44