# Preparing the training dataset

In [1]:
import pandas as pd

### First we import the dataset

In [2]:
# Load the raw question/answer pairs. The file is read with header=None, so its
# first line is treated as data and the columns get the integer labels 0 and 1.
qna_csv_path = '../res/QnA.csv'
all_questions = pd.read_csv(qna_csv_path, header=None, index_col=False)

In [3]:
all_questions

Unnamed: 0,0,1
0,What Happens When Term Life Insurance Is Paid Up?,Actually term life insurance cannot be paid up...
1,What Happens When Term Life Insurance Is Paid Up?,Term life insurance is never paid up. Assuming...
2,What Happens When Term Life Insurance Is Paid Up?,Term Life Insurance does not have the option t...
3,What Does Renters Insurance Cover?,A renters insurance policy will typically prov...
4,What Does Renters Insurance Cover?,If you apartment was on fire and all your pers...
...,...,...
27989,What is,I'm not sure.\n
27990,Can I,I'm not sure.\n
27991,Which,I'm not sure.\n
27992,Does,I'm not sure.\n


In [4]:
# The frame was loaded with header=None, so its two columns carry the integer
# labels 0 and 1; replace them with descriptive names.
all_questions.columns = ['Question', 'Answer']

In [5]:
all_questions.head()

Unnamed: 0,Question,Answer
0,What Happens When Term Life Insurance Is Paid Up?,Actually term life insurance cannot be paid up...
1,What Happens When Term Life Insurance Is Paid Up?,Term life insurance is never paid up. Assuming...
2,What Happens When Term Life Insurance Is Paid Up?,Term Life Insurance does not have the option t...
3,What Does Renters Insurance Cover?,A renters insurance policy will typically prov...
4,What Does Renters Insurance Cover?,If you apartment was on fire and all your pers...


In [6]:
all_questions.head(20)

Unnamed: 0,Question,Answer
0,What Happens When Term Life Insurance Is Paid Up?,Actually term life insurance cannot be paid up...
1,What Happens When Term Life Insurance Is Paid Up?,Term life insurance is never paid up. Assuming...
2,What Happens When Term Life Insurance Is Paid Up?,Term Life Insurance does not have the option t...
3,What Does Renters Insurance Cover?,A renters insurance policy will typically prov...
4,What Does Renters Insurance Cover?,If you apartment was on fire and all your pers...
5,Does Owning A Pitbull Raise Homeowners Insurance?,Most insurance companies do not surcharge for ...
6,What Should You Look For In Long Term Care Ins...,Every product purchase has a value proposition...
7,Will Medicare Pay For Smoking Cessation?,Medicare will not pay for smoking cessation pr...
8,What Is Eoi For Life Insurance?,"EOI in life insurance stands for ""evidence of ..."
9,What Companies Will Issue Life Insurance To Th...,None that I know of will underwrite a mentally...


In [7]:
all_questions.iloc[0]

Question    What Happens When Term Life Insurance Is Paid Up?
Answer      Actually term life insurance cannot be paid up...
Name: 0, dtype: object

### First, we drop all duplicate questions from our dataset

In [8]:
# Keep one row per distinct question text. The first occurrence is the one
# retained, so only that row's answer survives for a repeated question.
all_questions_unique = all_questions.drop_duplicates(subset=['Question'], keep='first')

In [9]:
all_questions_unique

Unnamed: 0,Question,Answer
0,What Happens When Term Life Insurance Is Paid Up?,Actually term life insurance cannot be paid up...
3,What Does Renters Insurance Cover?,A renters insurance policy will typically prov...
5,Does Owning A Pitbull Raise Homeowners Insurance?,Most insurance companies do not surcharge for ...
6,What Should You Look For In Long Term Care Ins...,Every product purchase has a value proposition...
7,Will Medicare Pay For Smoking Cessation?,Medicare will not pay for smoking cessation pr...
...,...,...
27989,What is,I'm not sure.\n
27990,Can I,I'm not sure.\n
27991,Which,I'm not sure.\n
27992,Does,I'm not sure.\n


In [10]:
all_questions_unique.tail(20)

Unnamed: 0,Question,Answer
27969,What Auto Insurance Limits Should I Have?,"The higher your liability limits, the less lik..."
27970,Is Medigap The Same As Supplemental Insurance?,Yes. When you hear the term Medicare Supplemen...
27971,Does Life Insurance Go To Credit Card Debt?,If you are the beneficiary of life insurance p...
27973,What Is Medigap Plan F?,Medigap plan F is the most popular Medigap pla...
27974,Who Is Eligible For USAA Life Insurance?,Persons who are members of USAA are eligible f...
27975,Is A Life Insurance Trust A Living Trust?,"When talking about a life insurance trust, mos..."
27976,Is Employer Provided Life Insurance Taxable?,"Yes, employer provided life insurance is taxab..."
27977,Which Retirement Plans Are Qualified?,A Qualified Retirement Plan is a plan that is ...
27978,Does Homeowners Insurance Cover A Shed?,"In many cases, Homeowners' Insurance policies ..."
27980,Why Do You Have To Have Car Insurance?,To protect yourself against financial devistat...


### We will also drop the final 7 rows, as they are not good examples for our training set

In [11]:
# Remove the last 7 rows of the de-duplicated frame. They are dropped by index
# label, so the remaining rows keep their original labels.
trailing_labels = all_questions_unique.index[-7:]
all_questions_unique = all_questions_unique.drop(index=trailing_labels)

In [12]:
all_questions_unique

Unnamed: 0,Question,Answer
0,What Happens When Term Life Insurance Is Paid Up?,Actually term life insurance cannot be paid up...
3,What Does Renters Insurance Cover?,A renters insurance policy will typically prov...
5,Does Owning A Pitbull Raise Homeowners Insurance?,Most insurance companies do not surcharge for ...
6,What Should You Look For In Long Term Care Ins...,Every product purchase has a value proposition...
7,Will Medicare Pay For Smoking Cessation?,Medicare will not pay for smoking cessation pr...
...,...,...
27978,Does Homeowners Insurance Cover A Shed?,"In many cases, Homeowners' Insurance policies ..."
27980,Why Do You Have To Have Car Insurance?,To protect yourself against financial devistat...
27981,Can Someone Buy Life Insurance For Someone Else?,The operative word in this question is for. Yo...
27983,How Much Home Insurance Do I Need?,How much home insurance do you want? Do you wa...


In [13]:
all_questions_unique.tail(10)

Unnamed: 0,Question,Answer
27973,What Is Medigap Plan F?,Medigap plan F is the most popular Medigap pla...
27974,Who Is Eligible For USAA Life Insurance?,Persons who are members of USAA are eligible f...
27975,Is A Life Insurance Trust A Living Trust?,"When talking about a life insurance trust, mos..."
27976,Is Employer Provided Life Insurance Taxable?,"Yes, employer provided life insurance is taxab..."
27977,Which Retirement Plans Are Qualified?,A Qualified Retirement Plan is a plan that is ...
27978,Does Homeowners Insurance Cover A Shed?,"In many cases, Homeowners' Insurance policies ..."
27980,Why Do You Have To Have Car Insurance?,To protect yourself against financial devistat...
27981,Can Someone Buy Life Insurance For Someone Else?,The operative word in this question is for. Yo...
27983,How Much Home Insurance Do I Need?,How much home insurance do you want? Do you wa...
27986,Does Geico Have Health Insurance?,I'm not aware of Geico having health insurance...


### Now that we have a dataset with unique questions, we will start building our training dataset

In [14]:
# Draw 100 rows at random from the unique questions. random_state is fixed so
# the draw is repeatable.
sample_100_questions = all_questions_unique.sample(n=100, random_state=6)

In [15]:
sample_100_questions

Unnamed: 0,Question,Answer
26107,Where Do You Get Disability Insurance?,If disability benefits are not offered through...
17770,Does Each Tenant Need Renters Insurance?,It is always wise for a tenant to carry Renter...
20809,Can Life Insurance Refuse To Pay?,Life insurance companies can refuse to pay the...
15750,Does Long Term Care Insurance Cover Assisted L...,"Yes, Long Term Care Insurance often covers ass..."
12859,How Do I Choose A Medigap Plan?,It can be overwhelming research Medigap on you...
...,...,...
20536,What To Look For In A Good Health Insurance Plan?,"The definition of ""good"" varies from person to..."
14299,Does Suze Orman Hate Whole Life Insurance?,Suze Orman usually does not recommend Whole Li...
14207,How Much Does It Cost To Add A Named Driver To...,This is nearly impossible to answer as the rat...
21128,Is Disability Insurance The Same As Workers Co...,"No, they are not the same. Workers compensatio..."


In [16]:
# Save the sample to disk. index=False leaves the original row labels out of the file.
sample_100_questions.to_csv('100_questions.csv', index=False)

### Saving the indices of the sampled rows, so we can delete them from the all_questions_unique dataset

In [17]:
# Original row labels of the sampled questions; they are used below to remove
# those rows from all_questions_unique.
sample_100_questions_indices = sample_100_questions.index

In [18]:
sample_100_questions_indices

Index([26107, 17770, 20809, 15750, 12859, 20679,   446, 11337, 15753, 26840,
        5643,  1400,   833,  5641, 23751,  9408, 21088, 12754, 14932, 13489,
       14825,  3805,  6774,  7468,  6266,  9000,   910, 22103, 25708, 11370,
        7600,  4666, 15915, 12275,  1445, 16851,  5237,  9901, 19147, 21132,
       24103, 15755, 21370, 17435, 22526,  7341,  2213, 21896,  3767, 10822,
       26525,  4624, 27780,  3536,  7359, 22230,  9500,  5673,  2612, 24452,
       10837, 19873,  4390,  3245,  2709,  4109, 15123,  6210, 10555,  8386,
        3054,  2378,  6138,  1987,  5216, 15331,  1516, 22433, 20178, 10899,
        6322,  4191, 17095, 14928, 16402,  3120, 24536,  6807, 19332, 14476,
       20561,    68, 18927, 15734,  7581, 20536, 14299, 14207, 21128,   659],
      dtype='int64')

### Deleting sample_100_questions from all_questions_unique -> so that we are left with distinct questions only

In [19]:
# Everything that was NOT picked in the first sample: remove the sampled rows
# by their index labels.
all_questions_unique_remaining = all_questions_unique.drop(index=sample_100_questions_indices)

In [20]:
all_questions_unique_remaining

Unnamed: 0,Question,Answer
0,What Happens When Term Life Insurance Is Paid Up?,Actually term life insurance cannot be paid up...
3,What Does Renters Insurance Cover?,A renters insurance policy will typically prov...
5,Does Owning A Pitbull Raise Homeowners Insurance?,Most insurance companies do not surcharge for ...
6,What Should You Look For In Long Term Care Ins...,Every product purchase has a value proposition...
7,Will Medicare Pay For Smoking Cessation?,Medicare will not pay for smoking cessation pr...
...,...,...
27978,Does Homeowners Insurance Cover A Shed?,"In many cases, Homeowners' Insurance policies ..."
27980,Why Do You Have To Have Car Insurance?,To protect yourself against financial devistat...
27981,Can Someone Buy Life Insurance For Someone Else?,The operative word in this question is for. Yo...
27983,How Much Home Insurance Do I Need?,How much home insurance do you want? Do you wa...


### Sampling another 100 (distinct/dissimilar) questions from all_questions_unique_remaining -> and adding them to sample_100_questions (as columns)

In [21]:
# Second random draw of 100 rows, taken from the frame that no longer contains
# the first sample, so a question can never be paired with itself. The index is
# reset to 0..99 so the rows line up by position with the first sample when the
# two frames are concatenated side by side.
# NOTE(review): random sampling only guarantees the paired questions are
# different rows, not that they are semantically dissimilar — TODO confirm the
# pairs before trusting the 0 label.
distinct_sample = all_questions_unique_remaining.sample(n=100, random_state=66).reset_index(drop=True)

In [22]:
distinct_sample

Unnamed: 0,Question,Answer
0,Is Long Term Disability Insurance The Same As ...,Although both insurance products are morbidity...
1,Does Your Spouse Have To Be Your Beneficiary F...,No your spouse is not required to be the benef...
2,How Much Is Enough Auto Insurance Coverage?,A client who had just purchased a $3 million P...
3,Is Long Term Care Insurance Regulated?,All Insurance companies are regulated by the N...
4,Can You Change From Medicare Advantage To Medi...,You can disenroll from your Medicare Advantage...
...,...,...
95,Can You Get Life Insurance If You Skydive?,That's a great question! Most insurance compan...
96,Do Life Insurance Agents Really Care Or Do The...,Having been in this business for more than 30 ...
97,Is Mental Health Covered By Insurance?,Great question! One of the great things about ...
98,Can You Have Two Long Term Disability Insuranc...,Yes. Many people have two disability policies....


In [23]:
# Put the two 100-row samples side by side (axis=1): the left-hand columns come
# from the first sample, the right-hand columns from the second. Both frames
# use a fresh 0-based index, so rows are paired by position.
# The right-hand columns get a '.1' suffix so the combined frame has no
# duplicate column labels (it would otherwise contain two 'Question' and two
# 'Answer' columns, which makes label-based access ambiguous).
combined_sample = pd.concat(
    [sample_100_questions.reset_index(drop=True), distinct_sample.add_suffix('.1')],
    axis=1,
)

In [24]:
combined_sample

Unnamed: 0,Question,Answer,Question.1,Answer.1
0,Where Do You Get Disability Insurance?,If disability benefits are not offered through...,Is Long Term Disability Insurance The Same As ...,Although both insurance products are morbidity...
1,Does Each Tenant Need Renters Insurance?,It is always wise for a tenant to carry Renter...,Does Your Spouse Have To Be Your Beneficiary F...,No your spouse is not required to be the benef...
2,Can Life Insurance Refuse To Pay?,Life insurance companies can refuse to pay the...,How Much Is Enough Auto Insurance Coverage?,A client who had just purchased a $3 million P...
3,Does Long Term Care Insurance Cover Assisted L...,"Yes, Long Term Care Insurance often covers ass...",Is Long Term Care Insurance Regulated?,All Insurance companies are regulated by the N...
4,How Do I Choose A Medigap Plan?,It can be overwhelming research Medigap on you...,Can You Change From Medicare Advantage To Medi...,You can disenroll from your Medicare Advantage...
...,...,...,...,...
95,What To Look For In A Good Health Insurance Plan?,"The definition of ""good"" varies from person to...",Can You Get Life Insurance If You Skydive?,That's a great question! Most insurance compan...
96,Does Suze Orman Hate Whole Life Insurance?,Suze Orman usually does not recommend Whole Li...,Do Life Insurance Agents Really Care Or Do The...,Having been in this business for more than 30 ...
97,How Much Does It Cost To Add A Named Driver To...,This is nearly impossible to answer as the rat...,Is Mental Health Covered By Insurance?,Great question! One of the great things about ...
98,Is Disability Insurance The Same As Workers Co...,"No, they are not the same. Workers compensatio...",Can You Have Two Long Term Disability Insuranc...,Yes. Many people have two disability policies....


In [25]:
# Intermediate snapshot of the four-column frame. The same file is written
# again further down, once the frame has been reshaped and labelled.
combined_sample.to_csv('combined_sample.csv', index=False)

In [26]:
combined_sample

Unnamed: 0,Question,Answer,Question.1,Answer.1
0,Where Do You Get Disability Insurance?,If disability benefits are not offered through...,Is Long Term Disability Insurance The Same As ...,Although both insurance products are morbidity...
1,Does Each Tenant Need Renters Insurance?,It is always wise for a tenant to carry Renter...,Does Your Spouse Have To Be Your Beneficiary F...,No your spouse is not required to be the benef...
2,Can Life Insurance Refuse To Pay?,Life insurance companies can refuse to pay the...,How Much Is Enough Auto Insurance Coverage?,A client who had just purchased a $3 million P...
3,Does Long Term Care Insurance Cover Assisted L...,"Yes, Long Term Care Insurance often covers ass...",Is Long Term Care Insurance Regulated?,All Insurance companies are regulated by the N...
4,How Do I Choose A Medigap Plan?,It can be overwhelming research Medigap on you...,Can You Change From Medicare Advantage To Medi...,You can disenroll from your Medicare Advantage...
...,...,...,...,...
95,What To Look For In A Good Health Insurance Plan?,"The definition of ""good"" varies from person to...",Can You Get Life Insurance If You Skydive?,That's a great question! Most insurance compan...
96,Does Suze Orman Hate Whole Life Insurance?,Suze Orman usually does not recommend Whole Li...,Do Life Insurance Agents Really Care Or Do The...,Having been in this business for more than 30 ...
97,How Much Does It Cost To Add A Named Driver To...,This is nearly impossible to answer as the rat...,Is Mental Health Covered By Insurance?,Great question! One of the great things about ...
98,Is Disability Insurance The Same As Workers Co...,"No, they are not the same. Workers compensatio...",Can You Have Two Long Term Disability Insuranc...,Yes. Many people have two disability policies....


### We drop the two 'Answer' columns and add an 'Output' column (set to 0, i.e. False)

In [27]:
# The answer columns sit at positions 1 and 3; look up their labels and drop
# them, leaving only the two question columns.
answer_labels = combined_sample.columns[[1, 3]]
combined_sample = combined_sample.drop(columns=answer_labels)

In [28]:
# First column: the question from the first sample. Second column: the question
# it is paired with.
combined_sample.columns = ['Question', 'Similar/Dissimilar']

In [29]:
combined_sample

Unnamed: 0,Question,Similar/Dissimilar
0,Where Do You Get Disability Insurance?,Is Long Term Disability Insurance The Same As ...
1,Does Each Tenant Need Renters Insurance?,Does Your Spouse Have To Be Your Beneficiary F...
2,Can Life Insurance Refuse To Pay?,How Much Is Enough Auto Insurance Coverage?
3,Does Long Term Care Insurance Cover Assisted L...,Is Long Term Care Insurance Regulated?
4,How Do I Choose A Medigap Plan?,Can You Change From Medicare Advantage To Medi...
...,...,...
95,What To Look For In A Good Health Insurance Plan?,Can You Get Life Insurance If You Skydive?
96,Does Suze Orman Hate Whole Life Insurance?,Do Life Insurance Agents Really Care Or Do The...
97,How Much Does It Cost To Add A Named Driver To...,Is Mental Health Covered By Insurance?
98,Is Disability Insurance The Same As Workers Co...,Can You Have Two Long Term Disability Insuranc...


In [30]:
# Label every pair built so far with 0.
combined_sample = combined_sample.assign(Output=0)

In [31]:
combined_sample

Unnamed: 0,Question,Similar/Dissimilar,Output
0,Where Do You Get Disability Insurance?,Is Long Term Disability Insurance The Same As ...,0
1,Does Each Tenant Need Renters Insurance?,Does Your Spouse Have To Be Your Beneficiary F...,0
2,Can Life Insurance Refuse To Pay?,How Much Is Enough Auto Insurance Coverage?,0
3,Does Long Term Care Insurance Cover Assisted L...,Is Long Term Care Insurance Regulated?,0
4,How Do I Choose A Medigap Plan?,Can You Change From Medicare Advantage To Medi...,0
...,...,...,...
95,What To Look For In A Good Health Insurance Plan?,Can You Get Life Insurance If You Skydive?,0
96,Does Suze Orman Hate Whole Life Insurance?,Do Life Insurance Agents Really Care Or Do The...,0
97,How Much Does It Cost To Add A Named Driver To...,Is Mental Health Covered By Insurance?,0
98,Is Disability Insurance The Same As Workers Co...,Can You Have Two Long Term Disability Insuranc...,0


In [32]:
# Overwrite the earlier snapshot with the three-column, 0-labelled frame.
combined_sample.to_csv('combined_sample.csv', index=False)

### Inserting similar questions into the dataset

In [34]:
# Start from a copy of the existing pairs so the 'Question' column is carried
# over; the other two columns are overwritten in the following cells.
similar_entries = combined_sample.copy()

In [35]:
# Blank placeholder for the similar question, which is to be filled in later.
# NOTE: with pandas' default settings an empty string is read back from CSV as NaN.
similar_entries['Similar/Dissimilar'] = ''

In [36]:
# These rows get the label 1.
similar_entries['Output'] = 1

In [37]:
similar_entries

Unnamed: 0,Question,Similar/Dissimilar,Output
0,Where Do You Get Disability Insurance?,,1
1,Does Each Tenant Need Renters Insurance?,,1
2,Can Life Insurance Refuse To Pay?,,1
3,Does Long Term Care Insurance Cover Assisted L...,,1
4,How Do I Choose A Medigap Plan?,,1
...,...,...,...
95,What To Look For In A Good Health Insurance Plan?,,1
96,Does Suze Orman Hate Whole Life Insurance?,,1
97,How Much Does It Cost To Add A Named Driver To...,,1
98,Is Disability Insurance The Same As Workers Co...,,1


In [39]:
# Stack the 1-labelled placeholder rows underneath the 0-labelled pairs and
# renumber the rows from 0 so the index stays unique.
combined_sample = pd.concat(
    (combined_sample, similar_entries),
    axis=0,
    ignore_index=True,
)

In [40]:
combined_sample

Unnamed: 0,Question,Similar/Dissimilar,Output
0,Where Do You Get Disability Insurance?,Is Long Term Disability Insurance The Same As ...,0
1,Does Each Tenant Need Renters Insurance?,Does Your Spouse Have To Be Your Beneficiary F...,0
2,Can Life Insurance Refuse To Pay?,How Much Is Enough Auto Insurance Coverage?,0
3,Does Long Term Care Insurance Cover Assisted L...,Is Long Term Care Insurance Regulated?,0
4,How Do I Choose A Medigap Plan?,Can You Change From Medicare Advantage To Medi...,0
...,...,...,...
195,What To Look For In A Good Health Insurance Plan?,,1
196,Does Suze Orman Hate Whole Life Insurance?,,1
197,How Much Does It Cost To Add A Named Driver To...,,1
198,Is Disability Insurance The Same As Workers Co...,,1


In [41]:
# Final write: the file now holds both the 0-labelled pairs and the 1-labelled
# rows whose second question is still blank.
combined_sample.to_csv('combined_sample.csv', index=False)

### Now all that is left to complete the similar questions is to populate them, using a service like QuillBot