In [1]:
import pandas as pd
import numpy as np
from sklearn.model_selection import train_test_split
import os
import shutil
import json
import re

# Do not truncate long text cells when DataFrames are displayed below.
pd.set_option('display.max_colwidth', None)

In [2]:
# Build a lookup from each line of test.target to the line at the same
# position in aee.preds, pooled over the run directories 0-4.
# Newlines are stripped from both sides; a target seen again in a later
# run overwrites the earlier entry.
preds_template = '../../../ceph_data/output/bart-AAE-v2-only-dot-direct-cola-au-full-mask-gen/{}/aee.preds'
targets_template = '../../../ceph_data/intermediate/bart-AAE-v2-only-dot-direct-cola-au-full-mask-gen/{}/test.target'

preds_dict = {}
for run_id in range(5):
    with open(preds_template.format(run_id), encoding='utf-8') as preds_file:
        generated_lines = preds_file.readlines()
    with open(targets_template.format(run_id), encoding='utf-8') as targets_file:
        target_lines = targets_file.readlines()
    # zip() stops at the shorter file, exactly like the pairwise loop it replaces.
    preds_dict.update(
        (target.replace('\n', ''), generated.replace('\n', ''))
        for generated, target in zip(generated_lines, target_lines)
    )

In [3]:
# Tokenized paragraphs with their sufficiency annotation.
df_aae_full = pd.read_csv(
    '../../../ceph_data/input/UKP-InsufficientArguments_v1.0/data-tokenized.tsv',
    sep='\t',
    index_col=False,
    encoding='latin-1',
)

# Intermediate JSON frames derived from the annotated-essays corpus.
df_aae = pd.read_json(
    '../../../ceph_data/intermediate/corpus-ukp-argument-annotated-essays-v2/aae3.json'
)
df_aae_invalid = pd.read_json(
    '../../../ceph_data/intermediate/corpus-ukp-argument-annotated-essays-v2/aae3_invalid.json'
)
df_aae_fixed = pd.read_json(
    '../../../ceph_data/intermediate/corpus-ukp-argument-annotated-essays-v2/aae3_fixed.json'
)

# Split table: first column is the argument id, followed by 100 columns
# named '0'..'99'.
split_column_names = ['index', *map(str, range(100))]
df_split = pd.read_csv(
    '../../../ceph_data/input/UKP-InsufficientArguments_v1.0/data-splitting.tsv',
    sep='\t',
    names=split_column_names,
    index_col=False,
)

# Argument id of the form 'essay<3-digit essay number>_<argument number>'.
df_aae_full['index'] = [
    'essay{}_{}'.format(str(essay_no).zfill(3), argument_no)
    for essay_no, argument_no in zip(df_aae_full['ESSAY'], df_aae_full['ARGUMENT'])
]

# Binary label: 0 for 'insufficient', 1 for everything else (including missing).
df_aae_full['local_sufficency'] = [
    0 if annotation == 'insufficient' else 1
    for annotation in df_aae_full['ANNOTATION']
]


In [4]:
# Load the masked paragraphs from the working directory; the columns used
# later in this notebook are 'index', 'TEXT' and 'TEXT_MASK'.
df_aae_full_mask = pd.read_csv('df_aae_full_mask.csv')

In [5]:
# Preview the first rows of the masked paragraphs.
df_aae_full_mask.head()

Unnamed: 0.1,Unnamed: 0,index,local_sufficency,TEXT,TEXT_MASK
0,0,essay001_1,1.0,"through cooperation, children can learn about interpersonal skills which are significant in the future life of all students","First of all, <mask>. What we acquired from team work is not only how to achieve the same goal with others but more importantly, how to get along with others. During the process of cooperation, children can learn about how to listen to opinions of others, how to communicate with others, how to think comprehensively, and even how to compromise with other team members when conflicts occurred. All of these skills help them to get on well with other people and will benefit them for the whole life."
1,1,essay001_2,0.0,competition makes the society more effective,"On the other hand, the significance of competition is that how to become more excellence to gain the victory. Hence it is always said that <mask>. However, when we consider about the question that how to win the game, we always find that we need the cooperation. The greater our goal is, the more competition we need. Take Olympic games which is a form of competition for instance, it is hard to imagine how an athlete could win the game without the training of his or her coach, and the help of other professional staffs such as the people who take care of his diet, and those who are in charge of the medical care. The winner is the athlete but the success belongs to the whole team. Therefore <unk>."
2,2,essay002_1,0.0,sustaining the cultural values of immigrants is paramount essential,"Firstly, maintaining one’s cultural identity is a key important rule to help individuals emerge in the new multicultural environments. Take Australia for example, immigrants from varieties of nations have a day called multicultural day where people from each country prepare their food and traditional activities for displaying in the public venues. Many Australians come this day to enjoy the shows, learn about the cultures and admire the diverse values. These feedbacks, in turn, help raise one’s pride of their cultures and help people understand each other more. Thus this makes it clear that <mask>."
3,3,essay002_2,1.0,keeping the cultural traditions in the destination countries is tremendous important,"Secondly, it is crucial to keep one’s identity for they need a connection back to their country as well as teach their children their value of origin. For instance, children immigrated to a new country will face social troubles in school with new friends. In this new environment, parent should find friends coming from their same country so that they can socialize in a very familiar manner as feeling being home. Fail to create this familiarity makes them felt isolated, in the extreme can lead to social disorder like autism. Hence, it is clear that <mask>."
4,4,essay003_1,0.0,tourism has clearly improved lives in the tourist country,"Firstly, international tourism promotes many aspects of the destination country’s economy in order to serve various demands of tourists. Take Cambodia for example, a large number of visitors coming to visit the Angkowat ancient temple need services like restaurants, hotels, souvenir shops and other stores. These demands trigger related business in the surrounding settings which in turn create many jobs for local people improve infrastructure and living standard. Therefore <mask>."


In [6]:
# Argument ids present in the full corpus but in neither df_aae nor
# df_aae_invalid, and the corresponding rows of df_aae_full.
claim_only_ids = set(df_aae_full['index']).difference(
    df_aae['index'],
    df_aae_invalid['index'],
)
only_claims = list(claim_only_ids)
df_aae_full_only_claims = df_aae_full.loc[df_aae_full['index'].isin(only_claims)]

In [7]:
# List the columns available in df_aae.
df_aae.columns

Index(['index', 'topic', 'para_text', 'premises', 'conclusion',
       'local_sufficency', 'au', 'major_claim'],
      dtype='object')

In [8]:
# List the columns available in df_aae_full_only_claims.
df_aae_full_only_claims.columns

Index(['ESSAY', 'ARGUMENT', 'TEXT', 'ANNOTATION', 'index', 'local_sufficency'], dtype='object')

In [9]:
# Preview the paragraphs whose id is in neither df_aae nor df_aae_invalid.
df_aae_full_only_claims.head()

Unnamed: 0,ESSAY,ARGUMENT,TEXT,ANNOTATION,index,local_sufficency
46,20,3,"On the other hand , I believe that governments should restrict the use of products that cause air pollution for both individuals and companies . Governments also should use an amount of money from their budgets to clean up the air , instead of putting all the responsibility to companies and private individuals .",,essay020_3,1
528,205,1,"Firstly , a liberal policy is very feasible . Checking for attendance requires a lot of bureaucracy . Especially for larger classes it is impossible to check for everybody to attend . So an optional attendance saves time and money .",,essay205_1,1
826,315,2,"Another thing that put big cities in front of small towns is the facilitates and services it contains which support and improve the quality of its inhabitants ' lives , hospitals , advanced medical facilities can satisfy one ' s need of medical safety . Cultural events such as exhibitions and theatre plays can enrich one ' s and widen his horizons , things which aren ' t offered by small towns .",,essay315_2,1
876,335,1,"Firstly , connecting people by email is easy and fast . In addition , World Wide Web offers humanity to access to information , which they want to know for less than 10 seconds . These are two of the benefits , why IT is useful .",,essay335_1,1


In [10]:
# List the columns available in df_aae_invalid.
df_aae_invalid.columns

Index(['index', 'topic', 'para_text', 'premises', 'conclusion',
       'local_sufficency', 'au', 'major_claim', 'removal_reason'],
      dtype='object')

In [11]:
# Collect, per argument id, the list of its conclusions in encounter order:
# first those from df_aae, then those from df_aae_invalid, and finally an
# empty-string entry for every row of df_aae_full_only_claims.
conclusions_dict = {}

annotated_sources = (df_aae, df_aae_invalid)
for source_df in annotated_sources:
    for arg_id, conclusion in zip(source_df['index'], source_df['conclusion']):
        conclusions_dict.setdefault(arg_id, []).append(conclusion)

for arg_id in df_aae_full_only_claims['index']:
    conclusions_dict.setdefault(arg_id, []).append('')

In [12]:
# For every argument id, start from the masked paragraph (TEXT_MASK of the
# first row for that id) and fill its '<mask>' slot with the generated
# conclusion looked up in preds_dict.  The j-th row of an id is paired with
# the j-th entry of conclusions_dict[id].
#
# Grouping once replaces re-filtering the whole frame for every row (which
# also recomputed duplicated ids).  sort=False keeps ids in first-appearance
# order and rows keep their original order inside each group.
# Assumes the 'index' column has no missing values (groupby drops such keys).
replaced_text_dict = {}
for index, rel_df in df_aae_full_mask.groupby('index', sort=False):
    gold_conclusions = conclusions_dict[index]
    masked_text = None
    for j, (_, row) in enumerate(rel_df.iterrows()):
        if masked_text is None:
            masked_text = row['TEXT_MASK']
        conclusion = gold_conclusions[j]
        if conclusion in preds_dict:
            # Wrap the generated conclusion in '</s>' markers and put it in the open slot.
            masked_text = masked_text.replace('<mask>', '</s> ' + preds_dict[conclusion] + ' </s>')
        else:
            # No prediction for this conclusion: the text built so far is
            # discarded and only the wrapped TEXT of this row is kept.
            masked_text = '</s> ' + row['TEXT'] + ' </s>'
        # Promote the pending '<unk>' slot(s) to '<mask>' for the next row.
        # NOTE(review): this renames every remaining '<unk>' at once, so with
        # three or more slots the later ones would all receive the same
        # prediction -- confirm this is intended.
        masked_text = masked_text.replace('<unk>', '<mask>')
    replaced_text_dict[index] = masked_text

In [13]:
# Attach the filled-in paragraph to every argument; an id that is missing
# from replaced_text_dict raises KeyError.
df_aae_full['REPLACED_TEXT'] = [
    replaced_text_dict[arg_id] for arg_id in df_aae_full['index']
]

In [15]:
# Spot-check 20 random rows; no random_state is set, so the sample differs per run.
df_aae_full.sample(20)

Unnamed: 0,ESSAY,ARGUMENT,TEXT,ANNOTATION,index,local_sufficency,REPLACED_TEXT
981,382,2,"Another point that students may benefit from technology is the shortened time for learning . The modern world provides learners with the mp3 , the mobile phone or the laptop that help them , especially language learners , listen to recordings everywhre or read documents anytime . Therefore , students will develop their skills at a greater pace . Moreover , the internet again , is an inexhaustible resource of visual aids , such as educational games , sounds or images with which students may absorb abstract concepts taught at school more briskly and thoroughly .",,essay382_2,1,"</s> the internet has also played a vital role in the development of students' skills </s>. The modern world provides learners with the mp3, the mobile phone or the laptop that help them, especially language learners, listen to recordings everywhre or read documents anytime. Therefore, students will develop their skills at a greater pace. Moreover, the internet again, is an inexhaustible resource of visual aids, such as educational games, sounds or images with which students may absorb abstract concepts taught at school more briskly and thoroughly."
519,201,3,"Finally , conservation leads us to a higher standard of living . I confess that art is one of the best ways of entertaining human beings , but , with exhaust fumes and acid rain , we do not have the energy and enthusiasm to appreciate the paintings or photographs . Biodiversity and a more beautiful nature are not only the results of abetter environment but also are the necessities of photography and other types of art .",,essay201_3,1,"Finally, </s> it is necessary to protect the environment </s>. I confess that art is one of the best ways of entertaining human beings, but, with exhaust fumes and acid rain, we do not have the energy and enthusiasm to appreciate the paintings or photographs. Biodiversity and a more beautiful nature are not only the results of abetter environment but also are the necessities of photography and other types of art."
839,320,1,"To begin with , type of temper is one of the reasons that make me to choose individual work instead of team one . Being by nature introvert , I have to spend much time and efforts on adjusting to surroundings and especially new people . Once , when I was working on presentation with strangers , I sat aside and so prepared more than half of work myself instead of making attempts to get acquainted with unknown people . Therefore , my productivity boosts when style of work is appropriate with my type of temper .",,essay320_1,1,"To begin with, type of temper is one of the reasons that make me to choose individual work instead of team one. Being by nature introvert, I have to spend much time and efforts on adjusting to surroundings and especially new people. Once, when I was working on presentation with strangers, I sat aside and so prepared more than half of work myself instead of making attempts to get acquainted with unknown people. Therefore, </s> to be a part of a team, I would prefer to work on my own </s>."
74,30,3,"Furthermore , this will encourage all the parents to think of the way to help their children to achieve more in their lives as they need to make some contribution too for their children future .",,essay030_3,1,"Furthermore, </s> Furthermore, parents should be responsible for their children </s> as they need to make some contribution too for their children future."
951,369,2,"Secondly , even though environmental damage is inevitable , it is not tourism to be blamed for . In order to turn a wilderness into a place of attraction , the planners must have taken the nourishment of the sceneries into thorough consideration . To be precise , for instance , a fortune is spent on trimming the trees , watering the flowers , preserving and balancing the local fauna and flora , in the hope of beautifying the wild . Not to mention ecotourism , a new kind of environment-friendly service , which gives all environmentalists and nature lovers a hand in raising the awareness of people in protecting their coexistent creatures . Because of that , tourism should not be alledged to be notorous for its detriment to the ecological diversity .",,essay369_2,1,"Secondly, even though environmental damage is inevitable, it is not tourism to be blamed for. In order to turn a wilderness into a place of attraction, the planners must have taken the nourishment of the sceneries into thorough consideration. To be precise, for instance, a fortune is spent on trimming the trees, watering the flowers, preserving and balancing the local fauna and flora, in the hope of beautifying the wild. Not to mention ecotourism, a new kind of environment-friendly service, which gives all environmentalists and nature lovers a hand in raising the awareness of people in protecting their coexistent creatures. Because of that, </s> tourism is not the best way to protect the environment </s>."
139,58,1,"Co-operation is essential for teamwork . Educational systems emphasize on encouraging co-operative approach in children . We live in a social setup and mutual help and sharing only leads to success . A person can not learn or achieve everything by oneself . For instance , lions hunt in a team . It is only due to their teamwork that they are able to catch a prey and make task easy . In the same way , co-operative approach will save time , energy and will have a higher success rate .",insufficient,essay058_1,0,"</s> co-operative approach is the best way to learn </s>. Educational systems emphasize on encouraging co-operative approach in children. We live in a social setup and mutual help and sharing only leads to success. A person can not learn or achieve everything by oneself. For instance, lions hunt in a team. It is only due to their teamwork that they are able to catch a prey and make task easy. In the same way, co-operative approach will save time, energy and will have a higher success rate."
922,356,2,"However , flourishing tourism in a place can be very rewarding in terms of local economy . Holiday makers flocking to other countries are not only bound to spend on tickets of attractions , but also pay for food , accommodation , transportation and entertainment . Both local people and governments can make a large amount of money through these services , and more employment opportunities can be created as well . I also believe the revenue earned form tourism can be used in turn to reduce pollution and protect the environment .",,essay356_2,1,"However, </s> tourism can be a great source of income for the local people </s>. Holiday makers flocking to other countries are not only bound to spend on tickets of attractions, but also pay for food, accommodation, transportation and entertainment. Both local people and governments can make a large amount of money through these services, and more employment opportunities can be created as well. I also believe the revenue earned form tourism can be used in turn to reduce pollution and protect the environment."
928,359,1,"There is no doubt that some behaviors of the tourists are not welcome in the local area . Firstly , some people leave the rubbish after visiting the attractions . Therefore , those local residents have to clean the place frequently so that the new batch of tourists will have a tidy and neat environment . Moreover , tourists may offend the local people due to their different culture background . For example , Indians don ' t eat beef since they worship cows . Thus , if tourists want to respect the tradition , they will not order any beef in the local restaurant .",insufficient,essay359_1,0,"There is no doubt that </s> there are some disadvantages to tourism </s>. Firstly, some people leave the rubbish after visiting the attractions. Therefore, those local residents have to clean the place frequently so that the new batch of tourists will have a tidy and neat environment. Moreover, tourists may offend the local people due to their different culture background. For example, Indians don't eat beef since they worship cows. Thus, if tourists want to respect the tradition, they will not order any beef in the local restaurant."
189,76,2,"On the other hand , some people oppose the argument , saying it is a waste of public money for the government to subsidize health care and education of each citizen in society , since a great number of people , in fact , have had the capacity to pay for the both privately . Instead , the government should give priority to more pressing problems related to social members ' wellbeing , such as soaring crime rate , AIDS epidemic or the shortage of infrastructure , which are requiring financial resources from the government to address .",,essay076_2,1,"On the other hand, some people oppose the argument, saying </s> the government should not spend more money on health care and education </s>, since a great number of people, in fact, have had the capacity to pay for the both privately. Instead, the government should give priority to more pressing problems related to social members' wellbeing, such as soaring crime rate, AIDS epidemic or the shortage of infrastructure, which are requiring financial resources from the government to address."
481,188,2,"Daily exercise will help also to develop children ' s brain function . It is well known how important it is to exercise regularly to help the body system to work better . When people exercise , the respiratory system ' s function is enhanced , helping all organs , including the brain , to get more oxygen in . Daily exercise will provide children with a mental break which will boost them to be efficient learners .",,essay188_2,1,"</s> it is important for children to be physically active </s>. It is well known how important it is to exercise regularly to help the body system to work better. When people exercise, the respiratory system's function is enhanced, helping all organs, including the brain, to get more oxygen in. Daily exercise will provide children with a mental break which will boost them to be efficient learners."


In [16]:
# Inspect the rows of df_aae_full whose id also appears in df_aae_invalid.
df_aae_full[df_aae_full['index'].isin(df_aae_invalid['index'])]

Unnamed: 0,ESSAY,ARGUMENT,TEXT,ANNOTATION,index,local_sufficency,REPLACED_TEXT
1,1,2,"On the other hand , the significance of competition is that how to become more excellence to gain the victory . Hence it is always said that competition makes the society more effective . However , when we consider about the question that how to win the game , we always find that we need the cooperation . The greater our goal is , the more competition we need . Take Olympic games which is a form of competition for instance , it is hard to imagine how an athlete could win the game without the training of his or her coach , and the help of other professional staffs such as the people who take care of his diet , and those who are in charge of the medical care . The winner is the athlete but the success belongs to the whole team . Therefore without the cooperation , there would be no victory of competition .",insufficient,essay001_2,0,"On the other hand, the significance of competition is that how to become more excellence to gain the victory. Hence it is always said that </s> competition is a form of cooperation </s>. However, when we consider about the question that how to win the game, we always find that we need the cooperation. The greater our goal is, the more competition we need. Take Olympic games which is a form of competition for instance, it is hard to imagine how an athlete could win the game without the training of his or her coach, and the help of other professional staffs such as the people who take care of his diet, and those who are in charge of the medical care. The winner is the athlete but the success belongs to the whole team. Therefore </s> competition is a form of cooperation </s>."
21,10,1,"First and foremost , carbon emission cut is significantly essential for protecting the atmosphere . The fact is that the more cars and motorbikes are on roads , the more seriously the ozone layer is damaged . If governments use more money to improve roads , there is a strong likelihood that more people drive their private cars work . This is sure to lead to more carbon emitted into the atmosphere , which can cause skin cancer and destroy the natural environment . Whereas , if there are more good buses , trains , or subways , people are inclined to use less private vehicles , which decreases the amount of carbon released . Obviously , the policy that concentrates money on developing public transportation brings an advantageous impact on earth .",,essay010_1,1,"First and foremost, carbon emission cut is significantly essential for protecting the atmosphere. The fact is that the more cars and motorbikes are on roads, the more seriously the ozone layer is damaged. If governments use more money to improve roads, there is a strong likelihood that more people drive their private cars work. </s> first and foremost, it is important to reduce the number of cars and motorbikes </s>. Whereas, if there are more good buses, trains, or subways, people are inclined to use less private vehicles, which decreases the amount of carbon released. Obviously, </s> first and foremost, there is a need to reduce the number of cars and motorbikes </s>."
25,11,3,"Last , but not least , financial sustainability of a region mostly depends on how healthy the population is . For instance , the money invested into physical education program can save allocations into healthcare , since the nation is comparatively healthy . Along with that , physically healthy people can contribute more both into economical and social development . As a matter of fact , the better a person feels , the better his brain works . Therefore , putting physical activities in early steps of human development would finally lead to mentally healthy society . As hence it ends up with financially competitive country .",,essay011_3,1,"Last, but not least, </s> Physical education can improve the health of the nation </s>. For instance, the money invested into physical education program can save allocations into healthcare, since the nation is comparatively healthy. Along with that, physically healthy people can contribute more both into economical and social development. As a matter of fact, the better a person feels, the better his brain works. Therefore, </s> Physical education can improve the health of the nation </s>. As hence it ends up with financially competitive country."
48,21,2,"Also , the more an advertisement of a product takes place in mass media , the more popular the product becomes . Advertisement is the most effective way to create a well-known product . Consumers tend to purchase the most known product when it comes to picking one out of two different brands of the same product . When a product is commonly used , it becomes trustworthy for the society , no matter what quality it is . However , it also has to be affordable for the consumer . Considering this fact , advertisements have undeniable affects on the society about the product being advertised . They make the product preferable .",,essay021_2,1,"Also, the more an advertisement of a product takes place in mass media, the more popular the product becomes. </s> advertising has an impact on the society </s>. Consumers tend to purchase the most known product when it comes to picking one out of two different brands of the same product. When a product is commonly used, it becomes trustworthy for the society, no matter what quality it is. However, it also has to be affordable for the consumer. Considering this fact, advertisements have undeniable affects on the society about the product being advertised. </s> advertising has an impact on the society </s>."
115,47,1,"To begin with , it is the right of wild species to live in a environment away from human beings . Given the fact that human beings are responsible for the heavy pollution and severe damage to the natural habitats of many wild animals , it is our responsibility to create a natural and safe environment for animals to live in . Apparently , the limited space and the artificial trees and lakes can not fully compensate the animals for their loss . Moreover , if rural animals are captured in the zoo for a long period , it would have negative influences on both the physical and psychological status of the creatures . As a result , the wild species would suffer from isolation and depression . It seems that zoos are more likely to be a killer rather than a protector in protecting wild lives .",,essay047_1,1,"To begin with, it is the right of wild species to live in a environment away from human beings. Given the fact that human beings are responsible for the heavy pollution and severe damage to the natural habitats of many wild animals, </s> wild animals have a right to live in a natural environment </s>. Apparently, the limited space and the artificial trees and lakes can not fully compensate the animals for their loss. Moreover, if rural animals are captured in the zoo for a long period, it would have negative influences on both the physical and psychological status of the creatures. As a result, the wild species would suffer from isolation and depression. It seems that </s> wild animals have a right to live in a natural environment </s>."
117,48,1,"To begin with , distance-learning brings significant convenience for students in every corner of the world . In earlier times , students who were tired of commuting had to attend schools nearby , regardless of any differences in teaching facilities , teacher ' s qualifications or the school reputation . Now , however , students are able to apply for online-courses provided by top-of-the-range universities and colleges worldwide . Furthermore , the presence of video conferencing allows a teacher to teach a greater number of students . Consequently , educational institutions are able to optimize costs by increasing teacher-student ratios . Thanks to the economical online-teaching , universities and colleges are able to offer grants for students who have outstanding academic achievements but are unable to attend schools because of financial constrains .",,essay048_1,1,"To begin with, </s> the advantages of online-teaching are obvious </s>. In earlier times, students who were tired of commuting had to attend schools nearby, regardless of any differences in teaching facilities, teacher's qualifications or the school reputation. Now, however, students are able to apply for online-courses provided by top-of-the-range universities and colleges worldwide. Furthermore, the presence of video conferencing allows a teacher to teach a greater number of students. Consequently, </s> the advantages of online-teaching are obvious </s>. Thanks to the economical online-teaching, universities and colleges are able to offer grants for students who have outstanding academic achievements but are unable to attend schools because of financial constrains."
123,51,1,"First , I think a library is vital and strategical part of a university . All professors and students need to have a modern and well-equipped library because , after internet , library plays an important role in research . Although sport is important , it does not have the same priority of library has . In addition only small part of students attend sport activities . For example , in my university number of students who use the library is much more than students do sports activities .",insufficient,essay051_1,0,"First, I think a library is vital and strategical part of a university. </s> first of all universities should have a library </s> because, after internet, library plays an important role in research. Although sport is important, </s> first of all universities should have a library </s>. In addition only small part of students attend sport activities. For example, in my university number of students who use the library is much more than students do sports activities."
131,54,2,"On the other hand , the importance of museums and art galleries is plain in terms of education and culture . First of all , authentic exhibits cannot be completely displayed only by images and videos . It is like travelling to a place is much better than viewing the landscape of that place on TV or photos , so the best method to learn one thing is to experience it . Furthermore , museums and art galleries preserve some culture heritages ; therefore , these buildings will not disappear unless people abandon their culture .",,essay054_2,1,"On the other hand, </s> museums and art galleries are the best way to learn about a place </s>. First of all, authentic exhibits cannot be completely displayed only by images and videos. It is like travelling to a place is much better than viewing the landscape of that place on TV or photos, so the best method to learn one thing is to experience it. Furthermore, museums and art galleries preserve some culture heritages; therefore, </s> museums and art galleries are the best way to learn about a place </s>."
182,73,1,"Firstly , pictures can influence the way people think . For example , nowadays horrendous images are displayed on the cigarette boxes to illustrate the consequences of smoking . As a result , statistics show a slight reduction in the number of smokers , indicating that they realize the effects of the negative habit . Not only that , the magnificent photograph captured by Kevin Carter , which portrayed a starving Sudanese child struck by extreme poverty has successfully highlighted the plight faced by the citizens in Sudan . Apart from that , images are also widely used in newspapers , magazines and advertisements . Thus , it is undeniable that images in the absence of words can obviously claim the attraction of many .",insufficient,essay073_1,0,"Firstly, </s> smoking has been affected by the use of images </s>. For example, nowadays horrendous images are displayed on the cigarette boxes to illustrate the consequences of smoking. As a result, statistics show a slight reduction in the number of smokers, indicating that they realize the effects of the negative habit. Not only that, the magnificent photograph captured by Kevin Carter, which portrayed a starving Sudanese child struck by extreme poverty has successfully highlighted the plight faced by the citizens in Sudan. Apart from that, images are also widely used in newspapers, magazines and advertisements. Thus, </s> smoking has been affected by the use of images </s>."
204,82,1,"First , it is generally understood that advertising is carried out with the main purpose of promoting different products and services or encouraging people to consume more . Advertisements are , therefore , very important for many businesses to increase sales and hence profits . Also , to consumers , advertising can bring them many benefits . For example , customers of telecommunication services will have an idea about the current offers of different companies and hence they can compare them and then have a better decision in choosing their internet or mobile phone plans . From all of these , it is easy to see why the idea that advertising is a positive part of life will garner strong support .",insufficient,essay082_1,0,"First, it is generally understood that advertising is carried out with the main purpose of promoting different products and services or encouraging people to consume more. </s> advertising is a positive part of life </s>. Also, </s> advertising is a positive part of life </s>. For example, customers of telecommunication services will have an idea about the current offers of different companies and hence they can compare them and then have a better decision in choosing their internet or mobile phone plans. From all of these, it is easy to see why the idea that advertising is a positive part of life will garner strong support."


In [17]:
# Filler columns (row positions) so that the exported TSV has the layout
# label / filler / filler / text / filler.
# NOTE(review): presumably the layout expected by the downstream reader -- confirm.
for placeholder in ('placeholder1', 'placeholder2', 'placeholder3'):
    df_aae_full[placeholder] = np.arange(len(df_aae_full))


def _reset_dir(directory):
    """Delete `directory` with all its contents if it exists, then recreate it empty."""
    if os.path.exists(directory):
        shutil.rmtree(directory)
    # makedirs (rather than mkdir) also creates missing parent directories.
    os.makedirs(directory)


# Root directories for the generated inputs (path) and for later outputs (path2).
path = '../../../ceph_data/intermediate/bert-AAE-v2-only-dot-direct-cola-au-full-replaced'
path2 = '../../../ceph_data/output/bert-AAE-v2-only-dot-direct-cola-au-full-replaced'
_reset_dir(path)
_reset_dir(path2)

export_columns = ['local_sufficency', 'placeholder1', 'placeholder2', 'REPLACED_TEXT', 'placeholder3']
split_files = (('TRAIN', 'train.tsv'), ('DEV', 'dev.tsv'), ('TEST', 'test.tsv'))

# One sub-directory per split column '0'..'99' of df_split.
for i in range(100):
    # Both roots were just recreated empty, so the sub-directories cannot exist yet.
    split_dir = os.path.join(path, str(i))
    os.mkdir(split_dir)
    os.mkdir(os.path.join(path2, str(i)))

    # Label every argument with TRAIN / DEV / TEST for this split; an id
    # missing from df_split raises KeyError.
    split_dict = dict(zip(df_split['index'], df_split[str(i)]))
    df_aae_full['split'] = df_aae_full['index'].apply(lambda x: split_dict[x])

    # Write into the directory derived from `path` instead of repeating the literal.
    for split_name, file_name in split_files:
        subset = df_aae_full.loc[df_aae_full['split'] == split_name, export_columns]
        subset.to_csv(os.path.join(split_dir, file_name), sep='\t', index=False)
