In [1]:
from os import getcwd
from os.path import join, dirname
import nlpaug.augmenter.word as naw
import nlpaug.augmenter.char as nac

import sys
PATH_REPO = dirname(getcwd())
PATH_UTILS = join(PATH_REPO, 'utils')
sys.path.append(PATH_UTILS)

In [2]:
import augmentation

### 1. Synonim Augmentation using wordnet

We replace nouns and adjectives by a synonim using Wordnet

In [3]:
text = "I like you because I think you are really smart my friend"
print(f"The original text is: \n{text}")
transformed_text = augmentation.get_syn_sentence(text)
print(f"the transformed text using wordnet is: \n{transformed_text}")

The original text is: 
I like you because I think you are really smart my friend
the transformed text using wordnet is: 
I like you because I think you are really saucy my protagonist


### 2. Negation + Antonym Augmentation using wordnet

We replace nouns and adjectives by "not + antonym"

In [4]:
text = "I like you because I think you are really smart my friend"
print(f"The original text is: \n{text}")
transformed_text = augmentation.get_neg_ant_sentence(text)
print(f"the transformed text using wordnet is: \n{transformed_text}")

The original text is: 
I like you because I think you are really smart my friend
the transformed text using wordnet is: 
I like you because I think you are really not stupid my not foe


### 3. Nlpaug for adding stopwords

In [5]:
aug = naw.ContextualWordEmbsAug(model_path='bert-base-uncased', action="insert")
text = "I like you because I think you are really smart my friend"
print(f"The original text is: \n{text}")
transformed_text = aug.augment(text)[0]
print(f"the transformed text using wordnet is: \n{transformed_text}")

The original text is: 
I like you because I think you are really smart my friend
the transformed text using wordnet is: 
now i quite like teasing you because again i think you are really smart my friend


### 4. Nlpaug adding characters (typos etc)

In [6]:
aug_char = nac.OcrAug() 
text = "I like ºyou because I think you are really smart my friend"
print(f"The original text is: \n{text}")
transformed_text = aug_char.augment(text)[0]
print(f"the transformed text using wordnet is: \n{transformed_text}")

The original text is: 
I like ºyou because I think you are really smart my friend
the transformed text using wordnet is: 
I like ºyou because 1 think y0o ake rea11y smart my friend


### 5. Backtranslation

In [7]:
text = "I like you because I think you are really smart my friend"
print(f"The original text is: \n{text}")
transformed_text = augmentation.backtranslate_text(text)
print(f"the transformed text using wordnet is: \n{transformed_text}")

The original text is: 
I like you because I think you are really smart my friend
the transformed text using wordnet is: 
I like you because I think you are very smart my friend


### 6. NER transformation

In [8]:
text = "I want to go to Barcelona and visit the offices of Apple"
print(f"The original text is: \n{text}")
transformed_text = augmentation.ner_augment(text)
print(f"the transformed text using wordnet is: \n{transformed_text}")

The original text is: 
I want to go to Barcelona and visit the offices of Apple
the transformed text using wordnet is: 
I want to go to Miami and visit the offices of Sun


### 7. Change singular to plural

In [9]:
text = "I like you because I think you are really smart my friend"
print(f"The original text is: \n{text}")
transformed_text = augmentation.plural_transform(text)
print(f"the transformed text using wordnet is: \n{transformed_text}")

The original text is: 
I like you because I think you are really smart my friend
the transformed text using wordnet is: 
I like you because I think you are really smarts my friends


### 8. Change plural to singular

In [10]:
text = "Tomorrow bring me my pencils"
print(f"The original text is: \n{text}")
transformed_text = augmentation.singular_transform(text)
print(f"the transformed text using wordnet is: \n{transformed_text}")

The original text is: 
Tomorrow bring me my pencils
the transformed text using wordnet is: 
Tomorrow bring me my pencil
