# Kaggle

https://www.kaggle.com/datasets/priyamchoksi/credit-card-transactions-dataset

# Importar bibliotecas

In [1]:
import os
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
from datetime import datetime
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import MinMaxScaler, StandardScaler, RobustScaler
from sklearn.linear_model import LogisticRegression
from sklearn.ensemble import RandomForestClassifier
from sklearn.tree import DecisionTreeClassifier
from sklearn.neighbors import KNeighborsClassifier
from sklearn.metrics import classification_report, confusion_matrix, accuracy_score, ConfusionMatrixDisplay
from sklearn.metrics import auc, roc_curve, precision_score, recall_score, f1_score, RocCurveDisplay
from tqdm import tqdm
import tensorflow as tf

In [2]:
os.makedirs('Results', exist_ok=True)

In [3]:
TIPO_DE_TRANSFORMACAO = 'standardization' #robust ou min_max

# Configurar o Pandas para exibir todas as colunas

In [4]:
pd.set_option('display.max_columns', None)

In [5]:
df = pd.read_csv('./Dados/credit_card_transactions.csv')

In [6]:
df.head()

Unnamed: 0.1,Unnamed: 0,trans_date_trans_time,cc_num,merchant,category,amt,first,last,gender,street,city,state,zip,lat,long,city_pop,job,dob,trans_num,unix_time,merch_lat,merch_long,is_fraud,merch_zipcode
0,0,2019-01-01 00:00:18,2703186189652095,"fraud_Rippin, Kub and Mann",misc_net,4.97,Jennifer,Banks,F,561 Perry Cove,Moravian Falls,NC,28654,36.0788,-81.1781,3495,"Psychologist, counselling",1988-03-09,0b242abb623afc578575680df30655b9,1325376018,36.011293,-82.048315,0,28705.0
1,1,2019-01-01 00:00:44,630423337322,"fraud_Heller, Gutmann and Zieme",grocery_pos,107.23,Stephanie,Gill,F,43039 Riley Greens Suite 393,Orient,WA,99160,48.8878,-118.2105,149,Special educational needs teacher,1978-06-21,1f76529f8574734946361c461b024d99,1325376044,49.159047,-118.186462,0,
2,2,2019-01-01 00:00:51,38859492057661,fraud_Lind-Buckridge,entertainment,220.11,Edward,Sanchez,M,594 White Dale Suite 530,Malad City,ID,83252,42.1808,-112.262,4154,Nature conservation officer,1962-01-19,a1a22d70485983eac12b5b88dad1cf95,1325376051,43.150704,-112.154481,0,83236.0
3,3,2019-01-01 00:01:16,3534093764340240,"fraud_Kutch, Hermiston and Farrell",gas_transport,45.0,Jeremy,White,M,9443 Cynthia Court Apt. 038,Boulder,MT,59632,46.2306,-112.1138,1939,Patent attorney,1967-01-12,6b849c168bdad6f867558c3793159a81,1325376076,47.034331,-112.561071,0,
4,4,2019-01-01 00:03:06,375534208663984,fraud_Keeling-Crist,misc_pos,41.96,Tyler,Garcia,M,408 Bradley Rest,Doe Hill,VA,24433,38.4207,-79.4629,99,Dance movement psychotherapist,1986-03-28,a41d7549acf90789359a9aa5346dcb46,1325376186,38.674999,-78.632459,0,22844.0


# Exibir o formato dos dados

In [7]:
df.shape

(1296675, 24)

# Verificar dados nulos

In [8]:
df.isnull().sum()

Unnamed: 0                    0
trans_date_trans_time         0
cc_num                        0
merchant                      0
category                      0
amt                           0
first                         0
last                          0
gender                        0
street                        0
city                          0
state                         0
zip                           0
lat                           0
long                          0
city_pop                      0
job                           0
dob                           0
trans_num                     0
unix_time                     0
merch_lat                     0
merch_long                    0
is_fraud                      0
merch_zipcode            195973
dtype: int64

# Remover coluna Unnamed

In [9]:
df.drop('Unnamed: 0', axis=1, inplace=True)

In [10]:
df.head()

Unnamed: 0,trans_date_trans_time,cc_num,merchant,category,amt,first,last,gender,street,city,state,zip,lat,long,city_pop,job,dob,trans_num,unix_time,merch_lat,merch_long,is_fraud,merch_zipcode
0,2019-01-01 00:00:18,2703186189652095,"fraud_Rippin, Kub and Mann",misc_net,4.97,Jennifer,Banks,F,561 Perry Cove,Moravian Falls,NC,28654,36.0788,-81.1781,3495,"Psychologist, counselling",1988-03-09,0b242abb623afc578575680df30655b9,1325376018,36.011293,-82.048315,0,28705.0
1,2019-01-01 00:00:44,630423337322,"fraud_Heller, Gutmann and Zieme",grocery_pos,107.23,Stephanie,Gill,F,43039 Riley Greens Suite 393,Orient,WA,99160,48.8878,-118.2105,149,Special educational needs teacher,1978-06-21,1f76529f8574734946361c461b024d99,1325376044,49.159047,-118.186462,0,
2,2019-01-01 00:00:51,38859492057661,fraud_Lind-Buckridge,entertainment,220.11,Edward,Sanchez,M,594 White Dale Suite 530,Malad City,ID,83252,42.1808,-112.262,4154,Nature conservation officer,1962-01-19,a1a22d70485983eac12b5b88dad1cf95,1325376051,43.150704,-112.154481,0,83236.0
3,2019-01-01 00:01:16,3534093764340240,"fraud_Kutch, Hermiston and Farrell",gas_transport,45.0,Jeremy,White,M,9443 Cynthia Court Apt. 038,Boulder,MT,59632,46.2306,-112.1138,1939,Patent attorney,1967-01-12,6b849c168bdad6f867558c3793159a81,1325376076,47.034331,-112.561071,0,
4,2019-01-01 00:03:06,375534208663984,fraud_Keeling-Crist,misc_pos,41.96,Tyler,Garcia,M,408 Bradley Rest,Doe Hill,VA,24433,38.4207,-79.4629,99,Dance movement psychotherapist,1986-03-28,a41d7549acf90789359a9aa5346dcb46,1325376186,38.674999,-78.632459,0,22844.0


# Balancear os dados

In [11]:
df['is_fraud'].value_counts()

is_fraud
0    1289169
1       7506
Name: count, dtype: int64

In [12]:
fraud_index = np.arange(df['is_fraud'].value_counts()[1])
np.random.shuffle(fraud_index)

In [13]:
df_selected_index = df[df['is_fraud'] == 0].iloc[fraud_index].copy()
df_selected_index.reset_index(drop=True, inplace=True)

In [14]:
df = pd.concat([df[df['is_fraud'] == 1], df_selected_index], ignore_index=True)

# Converter as colunas de data de transação e data de nascimento de de String para Timestamp

In [15]:
df['trans_date_trans_time'] = df['trans_date_trans_time'].apply(lambda x : datetime.strptime(x, '%Y-%m-%d %H:%M:%S'))
df['dob'] = df['dob'].apply(lambda x : datetime.strptime(x, '%Y-%m-%d'))

In [16]:
df.head()

Unnamed: 0,trans_date_trans_time,cc_num,merchant,category,amt,first,last,gender,street,city,state,zip,lat,long,city_pop,job,dob,trans_num,unix_time,merch_lat,merch_long,is_fraud,merch_zipcode
0,2019-01-02 01:06:37,4613314721966,fraud_Rutherford-Mertz,grocery_pos,281.06,Jason,Murphy,M,542 Steve Curve Suite 011,Collettsville,NC,28611,35.9946,-81.7266,885,Soil scientist,1988-09-15,e8a81877ae9a0a7f883e15cb39dc4022,1325466397,36.430124,-81.179483,1,28644.0
1,2019-01-02 01:47:29,340187018810220,"fraud_Jenkins, Hauck and Friesen",gas_transport,11.52,Misty,Hart,F,27954 Hall Mill Suite 575,San Antonio,TX,78208,29.44,-98.459,1595797,Horticultural consultant,1960-10-28,bc7d41c41103877b03232f03f1f8d3f5,1325468849,29.819364,-99.142791,1,78055.0
2,2019-01-02 03:05:23,340187018810220,fraud_Goodwin-Nitzsche,grocery_pos,276.31,Misty,Hart,F,27954 Hall Mill Suite 575,San Antonio,TX,78208,29.44,-98.459,1595797,Horticultural consultant,1960-10-28,b98f12f4168391b2203238813df5aa8c,1325473523,29.273085,-98.83636,1,78039.0
3,2019-01-02 03:38:03,4613314721966,fraud_Erdman-Kertzmann,gas_transport,7.03,Jason,Murphy,M,542 Steve Curve Suite 011,Collettsville,NC,28611,35.9946,-81.7266,885,Soil scientist,1988-09-15,397894a5c4c02e3c61c784001f0f14e4,1325475483,35.909292,-82.09101,1,28777.0
4,2019-01-02 03:55:47,340187018810220,fraud_Koepp-Parker,grocery_pos,275.73,Misty,Hart,F,27954 Hall Mill Suite 575,San Antonio,TX,78208,29.44,-98.459,1595797,Horticultural consultant,1960-10-28,7863235a750d73a244c07f1fb7f0185a,1325476547,29.786426,-98.68341,1,78006.0


# Remover colunas

In [17]:
df.drop(['cc_num', 'merchant', 'first', 'last', 'street', 'city', 'state', 'zip', 'lat', 'long', 'trans_num', 'unix_time', 'merch_zipcode'], axis=1, inplace=True)

In [18]:
df.head()

Unnamed: 0,trans_date_trans_time,category,amt,gender,city_pop,job,dob,merch_lat,merch_long,is_fraud
0,2019-01-02 01:06:37,grocery_pos,281.06,M,885,Soil scientist,1988-09-15,36.430124,-81.179483,1
1,2019-01-02 01:47:29,gas_transport,11.52,F,1595797,Horticultural consultant,1960-10-28,29.819364,-99.142791,1
2,2019-01-02 03:05:23,grocery_pos,276.31,F,1595797,Horticultural consultant,1960-10-28,29.273085,-98.83636,1
3,2019-01-02 03:38:03,gas_transport,7.03,M,885,Soil scientist,1988-09-15,35.909292,-82.09101,1
4,2019-01-02 03:55:47,grocery_pos,275.73,F,1595797,Horticultural consultant,1960-10-28,29.786426,-98.68341,1


In [19]:
len(df['category'].unique())

14

In [20]:
len(df['job'].unique())

494

# Calcular as idades com base na data de nascimento (dob)

In [21]:
df['age'] = df['dob'].apply(lambda x : round((datetime.today()-x).days/365))

In [22]:
df.head()

Unnamed: 0,trans_date_trans_time,category,amt,gender,city_pop,job,dob,merch_lat,merch_long,is_fraud,age
0,2019-01-02 01:06:37,grocery_pos,281.06,M,885,Soil scientist,1988-09-15,36.430124,-81.179483,1,36
1,2019-01-02 01:47:29,gas_transport,11.52,F,1595797,Horticultural consultant,1960-10-28,29.819364,-99.142791,1,64
2,2019-01-02 03:05:23,grocery_pos,276.31,F,1595797,Horticultural consultant,1960-10-28,29.273085,-98.83636,1,64
3,2019-01-02 03:38:03,gas_transport,7.03,M,885,Soil scientist,1988-09-15,35.909292,-82.09101,1,36
4,2019-01-02 03:55:47,grocery_pos,275.73,F,1595797,Horticultural consultant,1960-10-28,29.786426,-98.68341,1,64


# Remover as colunas de data

In [23]:
df.drop(['trans_date_trans_time', 'dob'], axis=1, inplace=True)

In [24]:
df.head()

Unnamed: 0,category,amt,gender,city_pop,job,merch_lat,merch_long,is_fraud,age
0,grocery_pos,281.06,M,885,Soil scientist,36.430124,-81.179483,1,36
1,gas_transport,11.52,F,1595797,Horticultural consultant,29.819364,-99.142791,1,64
2,grocery_pos,276.31,F,1595797,Horticultural consultant,29.273085,-98.83636,1,64
3,gas_transport,7.03,M,885,Soil scientist,35.909292,-82.09101,1,36
4,grocery_pos,275.73,F,1595797,Horticultural consultant,29.786426,-98.68341,1,64


# Transformar as colunas category, job e gender

In [25]:
categorical_columns = pd.get_dummies(df[['category', 'job', 'gender']], drop_first=True, dtype=int)

In [26]:
df.drop(['category', 'job', 'gender'], axis=1, inplace=True)

In [27]:
df = pd.concat([df, categorical_columns], axis=1)

In [28]:
#df.rename(columns={'gender_M':'gender'}, inplace=True)

In [29]:
df.head()

Unnamed: 0,amt,city_pop,merch_lat,merch_long,is_fraud,age,category_food_dining,category_gas_transport,category_grocery_net,category_grocery_pos,category_health_fitness,category_home,category_kids_pets,category_misc_net,category_misc_pos,category_personal_care,category_shopping_net,category_shopping_pos,category_travel,"job_Accountant, chartered","job_Accountant, chartered certified","job_Accountant, chartered public finance",job_Accounting technician,job_Acupuncturist,job_Administrator,"job_Administrator, arts","job_Administrator, charities/voluntary organisations","job_Administrator, education","job_Administrator, local government",job_Advertising account executive,job_Advertising account planner,job_Advertising copywriter,job_Advice worker,job_Aeronautical engineer,job_Agricultural consultant,job_Aid worker,job_Air broker,job_Air cabin crew,job_Air traffic controller,job_Airline pilot,job_Ambulance person,job_Amenity horticulturist,job_Analytical chemist,job_Animal nutritionist,job_Animal technologist,job_Animator,job_Applications developer,job_Arboriculturist,job_Archaeologist,job_Architect,job_Architectural technologist,job_Archivist,job_Armed forces logistics/support/administrative officer,job_Armed forces technical officer,job_Armed forces training and education officer,job_Art gallery manager,job_Art therapist,job_Artist,job_Arts development officer,job_Associate Professor,job_Audiological scientist,job_Barista,job_Barrister,job_Barrister's clerk,"job_Biochemist, clinical",job_Biomedical engineer,job_Biomedical scientist,job_Bookseller,job_Broadcast engineer,job_Broadcast journalist,job_Broadcast presenter,job_Building control surveyor,job_Building services engineer,job_Building surveyor,"job_Buyer, industrial","job_Buyer, retail",job_Cabin crew,job_Call centre manager,job_Camera operator,job_Careers adviser,job_Careers information officer,job_Cartographer,job_Catering manager,job_Ceramics designer,job_Charity fundraiser,job_Charity officer,job_Chartered accountant,job_Chartered legal executive (England and Wales),job_Chartered loss adjuster,job_Chartered public finance accountant,job_Chemical engineer,"job_Chemist, analytical",job_Chief Executive Officer,job_Chief Financial Officer,job_Chief Marketing Officer,job_Chief Operating Officer,job_Chief Strategy Officer,job_Chief Technology Officer,job_Chief of Staff,job_Child psychotherapist,job_Chiropodist,job_Civil Service administrator,job_Civil Service fast streamer,"job_Civil engineer, contracting",job_Claims inspector/assessor,job_Clinical biochemist,job_Clinical cytogeneticist,job_Clinical psychologist,job_Clinical research associate,job_Clothing/textile technologist,job_Colour technologist,job_Commercial horticulturist,job_Commercial/residential surveyor,job_Commissioning editor,job_Communications engineer,job_Community arts worker,job_Community development worker,job_Community education officer,job_Community pharmacist,job_Company secretary,job_Comptroller,"job_Conservation officer, historic buildings","job_Conservator, furniture","job_Conservator, museum/gallery",job_Contracting civil engineer,job_Contractor,job_Control and instrumentation engineer,job_Copy,"job_Copywriter, advertising",job_Corporate investment banker,job_Counselling psychologist,job_Counsellor,job_Curator,job_Cytogeneticist,job_Dance movement psychotherapist,job_Dancer,job_Data scientist,job_Database administrator,job_Dealer,"job_Designer, ceramics/pottery","job_Designer, exhibition/display","job_Designer, furniture","job_Designer, industrial/product","job_Designer, interior/spatial","job_Designer, jewellery","job_Designer, multimedia","job_Designer, television/film set","job_Designer, textile","job_Development worker, community","job_Development worker, international aid",job_Diagnostic radiographer,job_Dispensing optician,"job_Doctor, general practice","job_Doctor, hospital",job_Drilling engineer,job_Early years teacher,job_Ecologist,job_Economist,"job_Editor, commissioning","job_Editor, film/video","job_Editor, magazine features",job_Education administrator,"job_Education officer, community","job_Education officer, museum",job_Educational psychologist,job_Electrical engineer,job_Electronics engineer,"job_Embryologist, clinical",job_Emergency planning/management officer,job_Energy engineer,job_Energy manager,"job_Engineer, aeronautical","job_Engineer, agricultural","job_Engineer, automotive","job_Engineer, biomedical","job_Engineer, broadcasting (operations)","job_Engineer, building services","job_Engineer, civil (consulting)","job_Engineer, civil (contracting)","job_Engineer, communications","job_Engineer, control and instrumentation","job_Engineer, drilling","job_Engineer, electronics","job_Engineer, land","job_Engineer, maintenance","job_Engineer, manufacturing","job_Engineer, materials","job_Engineer, mining","job_Engineer, petroleum","job_Engineer, production","job_Engineer, site","job_Engineer, structural","job_Engineer, technical sales",job_Engineering geologist,job_English as a foreign language teacher,job_English as a second language teacher,job_Environmental consultant,job_Environmental education officer,job_Environmental health practitioner,job_Environmental manager,job_Equality and diversity officer,job_Equities trader,job_Estate manager/land agent,job_Event organiser,job_Exercise physiologist,job_Exhibition designer,"job_Exhibitions officer, museum/gallery",job_Facilities manager,job_Farm manager,job_Field seismologist,job_Field trials officer,job_Film/video editor,job_Financial adviser,job_Financial trader,job_Fine artist,job_Firefighter,job_Fisheries officer,job_Fitness centre manager,job_Forensic psychologist,job_Forest/woodland manager,job_Freight forwarder,job_Furniture conservator/restorer,job_Furniture designer,job_Further education lecturer,job_Futures trader,job_Gaffer,job_Garment/textile technologist,job_General practice doctor,"job_Geneticist, molecular",job_Geochemist,"job_Geologist, engineering","job_Geologist, wellsite",job_Geophysicist/field seismologist,job_Geoscientist,job_Glass blower/designer,job_Health and safety adviser,job_Health physicist,job_Health promotion specialist,job_Health service manager,job_Health visitor,job_Herbalist,job_Heritage manager,job_Herpetologist,job_Higher education careers adviser,job_Historic buildings inspector/conservation officer,job_Homeopath,job_Horticultural consultant,job_Horticultural therapist,"job_Horticulturist, commercial",job_Hospital doctor,job_Hospital pharmacist,job_Hotel manager,job_Human resources officer,job_Hydrogeologist,job_Hydrographic surveyor,job_Hydrologist,job_IT consultant,job_IT trainer,job_Illustrator,job_Immigration officer,job_Immunologist,job_Industrial buyer,job_Industrial/product designer,job_Information officer,job_Information systems manager,job_Insurance broker,job_Insurance claims handler,job_Insurance risk surveyor,job_Insurance underwriter,job_Intelligence analyst,job_Interior and spatial designer,job_Interpreter,job_Investment analyst,"job_Investment banker, corporate","job_Investment banker, operational",job_Jewellery designer,"job_Journalist, newspaper",job_Land,job_Land/geomatics surveyor,job_Landscape architect,job_Lawyer,job_Learning disability nurse,job_Learning mentor,"job_Lecturer, further education","job_Lecturer, higher education",job_Legal secretary,job_Leisure centre manager,job_Lexicographer,"job_Librarian, academic","job_Librarian, public",job_Licensed conveyancer,job_Local government officer,job_Location manager,job_Logistics and distribution manager,"job_Loss adjuster, chartered",job_Magazine features editor,job_Magazine journalist,job_Maintenance engineer,job_Make,job_Management consultant,job_Manufacturing engineer,job_Manufacturing systems engineer,job_Market researcher,job_Marketing executive,job_Materials engineer,job_Mechanical engineer,job_Media buyer,job_Media planner,job_Medical physicist,job_Medical sales representative,job_Medical secretary,job_Medical technical officer,job_Mental health nurse,"job_Merchandiser, retail",job_Metallurgist,job_Minerals surveyor,job_Mining engineer,job_Mudlogger,job_Multimedia programmer,job_Museum education officer,job_Museum/gallery conservator,job_Museum/gallery exhibitions officer,job_Music therapist,job_Music tutor,job_Musician,job_Nature conservation officer,job_Naval architect,job_Network engineer,job_Neurosurgeon,"job_Nurse, children's","job_Nurse, mental health",job_Nutritional therapist,job_Occupational hygienist,job_Occupational psychologist,job_Occupational therapist,job_Oceanographer,job_Oncologist,job_Operational researcher,job_Operations geologist,"job_Optician, dispensing",job_Optometrist,job_Orthoptist,job_Osteopath,job_Outdoor activities/education manager,job_Paediatric nurse,job_Paramedic,job_Patent attorney,job_Pathologist,job_Pension scheme manager,job_Pensions consultant,job_Personnel officer,job_Petroleum engineer,"job_Pharmacist, community","job_Pharmacist, hospital",job_Pharmacologist,"job_Physicist, medical",job_Physiological scientist,job_Physiotherapist,job_Phytotherapist,"job_Pilot, airline",job_Planning and development surveyor,job_Plant breeder/geneticist,job_Podiatrist,job_Police officer,job_Politician's assistant,"job_Presenter, broadcasting",job_Press photographer,job_Press sub,job_Primary school teacher,job_Prison officer,job_Private music teacher,job_Probation officer,"job_Producer, radio","job_Producer, television/film/video",job_Product designer,job_Product manager,job_Product/process development scientist,"job_Production assistant, radio","job_Production assistant, television",job_Production engineer,job_Production manager,job_Professor Emeritus,"job_Programme researcher, broadcasting/film/video","job_Programmer, applications","job_Programmer, multimedia",job_Psychiatric nurse,job_Psychiatrist,"job_Psychologist, clinical","job_Psychologist, counselling","job_Psychologist, forensic","job_Psychologist, sport and exercise",job_Psychotherapist,"job_Psychotherapist, child",job_Public affairs consultant,job_Public house manager,job_Public librarian,job_Public relations account executive,job_Public relations officer,job_Purchasing manager,job_Quantity surveyor,job_Quarry manager,job_Race relations officer,job_Radio broadcast assistant,job_Radio producer,"job_Radiographer, diagnostic","job_Radiographer, therapeutic",job_Records manager,job_Regulatory affairs officer,"job_Research officer, political party","job_Research officer, trade union",job_Research scientist (life sciences),job_Research scientist (maths),job_Research scientist (medical),job_Research scientist (physical sciences),"job_Restaurant manager, fast food",job_Retail banker,job_Retail buyer,job_Retail manager,job_Retail merchandiser,job_Risk analyst,job_Rural practice surveyor,job_Sales executive,"job_Sales professional, IT",job_Sales promotion account executive,job_Science writer,job_Scientific laboratory technician,"job_Scientist, audiological","job_Scientist, biomedical","job_Scientist, clinical (histocompatibility and immunogenetics)","job_Scientist, marine","job_Scientist, physiological","job_Scientist, research (maths)","job_Scientist, research (medical)","job_Scientist, research (physical sciences)",job_Secondary school teacher,job_Secretary/administrator,job_Seismic interpreter,job_Senior tax professional/tax inspector,job_Set designer,job_Ship broker,job_Site engineer,"job_Social research officer, government",job_Social researcher,job_Soil scientist,job_Solicitor,"job_Solicitor, Scotland",job_Special educational needs teacher,job_Special effects artist,job_Sport and exercise psychologist,job_Sports administrator,job_Sports development officer,job_Stage manager,job_Statistician,job_Structural engineer,job_Sub,job_Surgeon,"job_Surveyor, hydrographic","job_Surveyor, land/geomatics","job_Surveyor, minerals","job_Surveyor, mining","job_Surveyor, rural practice",job_Systems analyst,job_Systems developer,job_TEFL teacher,job_Tax adviser,job_Tax inspector,"job_Teacher, English as a foreign language","job_Teacher, adult education","job_Teacher, early years/pre","job_Teacher, primary school","job_Teacher, secondary school","job_Teacher, special educational needs",job_Teaching laboratory technician,job_Technical brewer,job_Telecommunications researcher,job_Television camera operator,job_Television floor manager,job_Television production assistant,job_Television/film/video producer,job_Textile designer,job_Theatre director,job_Theatre manager,job_Theme park manager,"job_Therapist, art","job_Therapist, drama","job_Therapist, horticultural","job_Therapist, music","job_Therapist, occupational","job_Therapist, sports",job_Tour manager,job_Tourism officer,job_Tourist information centre manager,job_Town planner,job_Toxicologist,job_Trade mark attorney,job_Trading standards officer,job_Training and development officer,job_Transport planner,job_Travel agency manager,job_Tree surgeon,job_Veterinary surgeon,job_Video editor,job_Visual merchandiser,job_Volunteer coordinator,job_Warden/ranger,job_Warehouse manager,job_Waste management officer,job_Water engineer,job_Water quality scientist,job_Web designer,job_Wellsite geologist,job_Writer,gender_M
0,281.06,885,36.430124,-81.179483,1,36,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1
1,11.52,1595797,29.819364,-99.142791,1,64,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
2,276.31,1595797,29.273085,-98.83636,1,64,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
3,7.03,885,35.909292,-82.09101,1,36,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1
4,275.73,1595797,29.786426,-98.68341,1,64,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0


In [30]:
df.shape

(15012, 513)

# Separar os dados em treino e teste

In [31]:
is_fraud = df['is_fraud'].copy()

In [32]:
X = df.drop('is_fraud', axis=1).copy()
y = df['is_fraud'].copy()

X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.3, random_state=0, stratify=is_fraud)
X_train.reset_index(drop=True, inplace=True)
X_test.reset_index(drop=True, inplace=True)
y_train.reset_index(drop=True, inplace=True)
y_test.reset_index(drop=True, inplace=True)

In [33]:
print(f'X treino shape: {X_train.shape}')
print(f'X teste shape: {X_test.shape}')

X treino shape: (10508, 512)
X teste shape: (4504, 512)


In [34]:
print(f'y treino shape: {y_train.shape}')
print(f'y teste shape: {y_test.shape}')

y treino shape: (10508,)
y teste shape: (4504,)


In [35]:
X_train.head()

Unnamed: 0,amt,city_pop,merch_lat,merch_long,age,category_food_dining,category_gas_transport,category_grocery_net,category_grocery_pos,category_health_fitness,category_home,category_kids_pets,category_misc_net,category_misc_pos,category_personal_care,category_shopping_net,category_shopping_pos,category_travel,"job_Accountant, chartered","job_Accountant, chartered certified","job_Accountant, chartered public finance",job_Accounting technician,job_Acupuncturist,job_Administrator,"job_Administrator, arts","job_Administrator, charities/voluntary organisations","job_Administrator, education","job_Administrator, local government",job_Advertising account executive,job_Advertising account planner,job_Advertising copywriter,job_Advice worker,job_Aeronautical engineer,job_Agricultural consultant,job_Aid worker,job_Air broker,job_Air cabin crew,job_Air traffic controller,job_Airline pilot,job_Ambulance person,job_Amenity horticulturist,job_Analytical chemist,job_Animal nutritionist,job_Animal technologist,job_Animator,job_Applications developer,job_Arboriculturist,job_Archaeologist,job_Architect,job_Architectural technologist,job_Archivist,job_Armed forces logistics/support/administrative officer,job_Armed forces technical officer,job_Armed forces training and education officer,job_Art gallery manager,job_Art therapist,job_Artist,job_Arts development officer,job_Associate Professor,job_Audiological scientist,job_Barista,job_Barrister,job_Barrister's clerk,"job_Biochemist, clinical",job_Biomedical engineer,job_Biomedical scientist,job_Bookseller,job_Broadcast engineer,job_Broadcast journalist,job_Broadcast presenter,job_Building control surveyor,job_Building services engineer,job_Building surveyor,"job_Buyer, industrial","job_Buyer, retail",job_Cabin crew,job_Call centre manager,job_Camera operator,job_Careers adviser,job_Careers information officer,job_Cartographer,job_Catering manager,job_Ceramics designer,job_Charity fundraiser,job_Charity officer,job_Chartered accountant,job_Chartered legal executive (England and Wales),job_Chartered loss adjuster,job_Chartered public finance accountant,job_Chemical engineer,"job_Chemist, analytical",job_Chief Executive Officer,job_Chief Financial Officer,job_Chief Marketing Officer,job_Chief Operating Officer,job_Chief Strategy Officer,job_Chief Technology Officer,job_Chief of Staff,job_Child psychotherapist,job_Chiropodist,job_Civil Service administrator,job_Civil Service fast streamer,"job_Civil engineer, contracting",job_Claims inspector/assessor,job_Clinical biochemist,job_Clinical cytogeneticist,job_Clinical psychologist,job_Clinical research associate,job_Clothing/textile technologist,job_Colour technologist,job_Commercial horticulturist,job_Commercial/residential surveyor,job_Commissioning editor,job_Communications engineer,job_Community arts worker,job_Community development worker,job_Community education officer,job_Community pharmacist,job_Company secretary,job_Comptroller,"job_Conservation officer, historic buildings","job_Conservator, furniture","job_Conservator, museum/gallery",job_Contracting civil engineer,job_Contractor,job_Control and instrumentation engineer,job_Copy,"job_Copywriter, advertising",job_Corporate investment banker,job_Counselling psychologist,job_Counsellor,job_Curator,job_Cytogeneticist,job_Dance movement psychotherapist,job_Dancer,job_Data scientist,job_Database administrator,job_Dealer,"job_Designer, ceramics/pottery","job_Designer, exhibition/display","job_Designer, furniture","job_Designer, industrial/product","job_Designer, interior/spatial","job_Designer, jewellery","job_Designer, multimedia","job_Designer, television/film set","job_Designer, textile","job_Development worker, community","job_Development worker, international aid",job_Diagnostic radiographer,job_Dispensing optician,"job_Doctor, general practice","job_Doctor, hospital",job_Drilling engineer,job_Early years teacher,job_Ecologist,job_Economist,"job_Editor, commissioning","job_Editor, film/video","job_Editor, magazine features",job_Education administrator,"job_Education officer, community","job_Education officer, museum",job_Educational psychologist,job_Electrical engineer,job_Electronics engineer,"job_Embryologist, clinical",job_Emergency planning/management officer,job_Energy engineer,job_Energy manager,"job_Engineer, aeronautical","job_Engineer, agricultural","job_Engineer, automotive","job_Engineer, biomedical","job_Engineer, broadcasting (operations)","job_Engineer, building services","job_Engineer, civil (consulting)","job_Engineer, civil (contracting)","job_Engineer, communications","job_Engineer, control and instrumentation","job_Engineer, drilling","job_Engineer, electronics","job_Engineer, land","job_Engineer, maintenance","job_Engineer, manufacturing","job_Engineer, materials","job_Engineer, mining","job_Engineer, petroleum","job_Engineer, production","job_Engineer, site","job_Engineer, structural","job_Engineer, technical sales",job_Engineering geologist,job_English as a foreign language teacher,job_English as a second language teacher,job_Environmental consultant,job_Environmental education officer,job_Environmental health practitioner,job_Environmental manager,job_Equality and diversity officer,job_Equities trader,job_Estate manager/land agent,job_Event organiser,job_Exercise physiologist,job_Exhibition designer,"job_Exhibitions officer, museum/gallery",job_Facilities manager,job_Farm manager,job_Field seismologist,job_Field trials officer,job_Film/video editor,job_Financial adviser,job_Financial trader,job_Fine artist,job_Firefighter,job_Fisheries officer,job_Fitness centre manager,job_Forensic psychologist,job_Forest/woodland manager,job_Freight forwarder,job_Furniture conservator/restorer,job_Furniture designer,job_Further education lecturer,job_Futures trader,job_Gaffer,job_Garment/textile technologist,job_General practice doctor,"job_Geneticist, molecular",job_Geochemist,"job_Geologist, engineering","job_Geologist, wellsite",job_Geophysicist/field seismologist,job_Geoscientist,job_Glass blower/designer,job_Health and safety adviser,job_Health physicist,job_Health promotion specialist,job_Health service manager,job_Health visitor,job_Herbalist,job_Heritage manager,job_Herpetologist,job_Higher education careers adviser,job_Historic buildings inspector/conservation officer,job_Homeopath,job_Horticultural consultant,job_Horticultural therapist,"job_Horticulturist, commercial",job_Hospital doctor,job_Hospital pharmacist,job_Hotel manager,job_Human resources officer,job_Hydrogeologist,job_Hydrographic surveyor,job_Hydrologist,job_IT consultant,job_IT trainer,job_Illustrator,job_Immigration officer,job_Immunologist,job_Industrial buyer,job_Industrial/product designer,job_Information officer,job_Information systems manager,job_Insurance broker,job_Insurance claims handler,job_Insurance risk surveyor,job_Insurance underwriter,job_Intelligence analyst,job_Interior and spatial designer,job_Interpreter,job_Investment analyst,"job_Investment banker, corporate","job_Investment banker, operational",job_Jewellery designer,"job_Journalist, newspaper",job_Land,job_Land/geomatics surveyor,job_Landscape architect,job_Lawyer,job_Learning disability nurse,job_Learning mentor,"job_Lecturer, further education","job_Lecturer, higher education",job_Legal secretary,job_Leisure centre manager,job_Lexicographer,"job_Librarian, academic","job_Librarian, public",job_Licensed conveyancer,job_Local government officer,job_Location manager,job_Logistics and distribution manager,"job_Loss adjuster, chartered",job_Magazine features editor,job_Magazine journalist,job_Maintenance engineer,job_Make,job_Management consultant,job_Manufacturing engineer,job_Manufacturing systems engineer,job_Market researcher,job_Marketing executive,job_Materials engineer,job_Mechanical engineer,job_Media buyer,job_Media planner,job_Medical physicist,job_Medical sales representative,job_Medical secretary,job_Medical technical officer,job_Mental health nurse,"job_Merchandiser, retail",job_Metallurgist,job_Minerals surveyor,job_Mining engineer,job_Mudlogger,job_Multimedia programmer,job_Museum education officer,job_Museum/gallery conservator,job_Museum/gallery exhibitions officer,job_Music therapist,job_Music tutor,job_Musician,job_Nature conservation officer,job_Naval architect,job_Network engineer,job_Neurosurgeon,"job_Nurse, children's","job_Nurse, mental health",job_Nutritional therapist,job_Occupational hygienist,job_Occupational psychologist,job_Occupational therapist,job_Oceanographer,job_Oncologist,job_Operational researcher,job_Operations geologist,"job_Optician, dispensing",job_Optometrist,job_Orthoptist,job_Osteopath,job_Outdoor activities/education manager,job_Paediatric nurse,job_Paramedic,job_Patent attorney,job_Pathologist,job_Pension scheme manager,job_Pensions consultant,job_Personnel officer,job_Petroleum engineer,"job_Pharmacist, community","job_Pharmacist, hospital",job_Pharmacologist,"job_Physicist, medical",job_Physiological scientist,job_Physiotherapist,job_Phytotherapist,"job_Pilot, airline",job_Planning and development surveyor,job_Plant breeder/geneticist,job_Podiatrist,job_Police officer,job_Politician's assistant,"job_Presenter, broadcasting",job_Press photographer,job_Press sub,job_Primary school teacher,job_Prison officer,job_Private music teacher,job_Probation officer,"job_Producer, radio","job_Producer, television/film/video",job_Product designer,job_Product manager,job_Product/process development scientist,"job_Production assistant, radio","job_Production assistant, television",job_Production engineer,job_Production manager,job_Professor Emeritus,"job_Programme researcher, broadcasting/film/video","job_Programmer, applications","job_Programmer, multimedia",job_Psychiatric nurse,job_Psychiatrist,"job_Psychologist, clinical","job_Psychologist, counselling","job_Psychologist, forensic","job_Psychologist, sport and exercise",job_Psychotherapist,"job_Psychotherapist, child",job_Public affairs consultant,job_Public house manager,job_Public librarian,job_Public relations account executive,job_Public relations officer,job_Purchasing manager,job_Quantity surveyor,job_Quarry manager,job_Race relations officer,job_Radio broadcast assistant,job_Radio producer,"job_Radiographer, diagnostic","job_Radiographer, therapeutic",job_Records manager,job_Regulatory affairs officer,"job_Research officer, political party","job_Research officer, trade union",job_Research scientist (life sciences),job_Research scientist (maths),job_Research scientist (medical),job_Research scientist (physical sciences),"job_Restaurant manager, fast food",job_Retail banker,job_Retail buyer,job_Retail manager,job_Retail merchandiser,job_Risk analyst,job_Rural practice surveyor,job_Sales executive,"job_Sales professional, IT",job_Sales promotion account executive,job_Science writer,job_Scientific laboratory technician,"job_Scientist, audiological","job_Scientist, biomedical","job_Scientist, clinical (histocompatibility and immunogenetics)","job_Scientist, marine","job_Scientist, physiological","job_Scientist, research (maths)","job_Scientist, research (medical)","job_Scientist, research (physical sciences)",job_Secondary school teacher,job_Secretary/administrator,job_Seismic interpreter,job_Senior tax professional/tax inspector,job_Set designer,job_Ship broker,job_Site engineer,"job_Social research officer, government",job_Social researcher,job_Soil scientist,job_Solicitor,"job_Solicitor, Scotland",job_Special educational needs teacher,job_Special effects artist,job_Sport and exercise psychologist,job_Sports administrator,job_Sports development officer,job_Stage manager,job_Statistician,job_Structural engineer,job_Sub,job_Surgeon,"job_Surveyor, hydrographic","job_Surveyor, land/geomatics","job_Surveyor, minerals","job_Surveyor, mining","job_Surveyor, rural practice",job_Systems analyst,job_Systems developer,job_TEFL teacher,job_Tax adviser,job_Tax inspector,"job_Teacher, English as a foreign language","job_Teacher, adult education","job_Teacher, early years/pre","job_Teacher, primary school","job_Teacher, secondary school","job_Teacher, special educational needs",job_Teaching laboratory technician,job_Technical brewer,job_Telecommunications researcher,job_Television camera operator,job_Television floor manager,job_Television production assistant,job_Television/film/video producer,job_Textile designer,job_Theatre director,job_Theatre manager,job_Theme park manager,"job_Therapist, art","job_Therapist, drama","job_Therapist, horticultural","job_Therapist, music","job_Therapist, occupational","job_Therapist, sports",job_Tour manager,job_Tourism officer,job_Tourist information centre manager,job_Town planner,job_Toxicologist,job_Trade mark attorney,job_Trading standards officer,job_Training and development officer,job_Transport planner,job_Travel agency manager,job_Tree surgeon,job_Veterinary surgeon,job_Video editor,job_Visual merchandiser,job_Volunteer coordinator,job_Warden/ranger,job_Warehouse manager,job_Waste management officer,job_Water engineer,job_Water quality scientist,job_Web designer,job_Wellsite geologist,job_Writer,gender_M
0,53.32,372,44.367747,-85.586295,29,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
1,66.64,1087,43.671828,-92.861168,61,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1
2,935.13,16955,45.543601,-118.293693,63,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
3,16.47,516,47.77641,-95.18304,58,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
4,940.89,737,40.721802,-74.620721,37,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1


In [36]:
X_test.head()

Unnamed: 0,amt,city_pop,merch_lat,merch_long,age,category_food_dining,category_gas_transport,category_grocery_net,category_grocery_pos,category_health_fitness,category_home,category_kids_pets,category_misc_net,category_misc_pos,category_personal_care,category_shopping_net,category_shopping_pos,category_travel,"job_Accountant, chartered","job_Accountant, chartered certified","job_Accountant, chartered public finance",job_Accounting technician,job_Acupuncturist,job_Administrator,"job_Administrator, arts","job_Administrator, charities/voluntary organisations","job_Administrator, education","job_Administrator, local government",job_Advertising account executive,job_Advertising account planner,job_Advertising copywriter,job_Advice worker,job_Aeronautical engineer,job_Agricultural consultant,job_Aid worker,job_Air broker,job_Air cabin crew,job_Air traffic controller,job_Airline pilot,job_Ambulance person,job_Amenity horticulturist,job_Analytical chemist,job_Animal nutritionist,job_Animal technologist,job_Animator,job_Applications developer,job_Arboriculturist,job_Archaeologist,job_Architect,job_Architectural technologist,job_Archivist,job_Armed forces logistics/support/administrative officer,job_Armed forces technical officer,job_Armed forces training and education officer,job_Art gallery manager,job_Art therapist,job_Artist,job_Arts development officer,job_Associate Professor,job_Audiological scientist,job_Barista,job_Barrister,job_Barrister's clerk,"job_Biochemist, clinical",job_Biomedical engineer,job_Biomedical scientist,job_Bookseller,job_Broadcast engineer,job_Broadcast journalist,job_Broadcast presenter,job_Building control surveyor,job_Building services engineer,job_Building surveyor,"job_Buyer, industrial","job_Buyer, retail",job_Cabin crew,job_Call centre manager,job_Camera operator,job_Careers adviser,job_Careers information officer,job_Cartographer,job_Catering manager,job_Ceramics designer,job_Charity fundraiser,job_Charity officer,job_Chartered accountant,job_Chartered legal executive (England and Wales),job_Chartered loss adjuster,job_Chartered public finance accountant,job_Chemical engineer,"job_Chemist, analytical",job_Chief Executive Officer,job_Chief Financial Officer,job_Chief Marketing Officer,job_Chief Operating Officer,job_Chief Strategy Officer,job_Chief Technology Officer,job_Chief of Staff,job_Child psychotherapist,job_Chiropodist,job_Civil Service administrator,job_Civil Service fast streamer,"job_Civil engineer, contracting",job_Claims inspector/assessor,job_Clinical biochemist,job_Clinical cytogeneticist,job_Clinical psychologist,job_Clinical research associate,job_Clothing/textile technologist,job_Colour technologist,job_Commercial horticulturist,job_Commercial/residential surveyor,job_Commissioning editor,job_Communications engineer,job_Community arts worker,job_Community development worker,job_Community education officer,job_Community pharmacist,job_Company secretary,job_Comptroller,"job_Conservation officer, historic buildings","job_Conservator, furniture","job_Conservator, museum/gallery",job_Contracting civil engineer,job_Contractor,job_Control and instrumentation engineer,job_Copy,"job_Copywriter, advertising",job_Corporate investment banker,job_Counselling psychologist,job_Counsellor,job_Curator,job_Cytogeneticist,job_Dance movement psychotherapist,job_Dancer,job_Data scientist,job_Database administrator,job_Dealer,"job_Designer, ceramics/pottery","job_Designer, exhibition/display","job_Designer, furniture","job_Designer, industrial/product","job_Designer, interior/spatial","job_Designer, jewellery","job_Designer, multimedia","job_Designer, television/film set","job_Designer, textile","job_Development worker, community","job_Development worker, international aid",job_Diagnostic radiographer,job_Dispensing optician,"job_Doctor, general practice","job_Doctor, hospital",job_Drilling engineer,job_Early years teacher,job_Ecologist,job_Economist,"job_Editor, commissioning","job_Editor, film/video","job_Editor, magazine features",job_Education administrator,"job_Education officer, community","job_Education officer, museum",job_Educational psychologist,job_Electrical engineer,job_Electronics engineer,"job_Embryologist, clinical",job_Emergency planning/management officer,job_Energy engineer,job_Energy manager,"job_Engineer, aeronautical","job_Engineer, agricultural","job_Engineer, automotive","job_Engineer, biomedical","job_Engineer, broadcasting (operations)","job_Engineer, building services","job_Engineer, civil (consulting)","job_Engineer, civil (contracting)","job_Engineer, communications","job_Engineer, control and instrumentation","job_Engineer, drilling","job_Engineer, electronics","job_Engineer, land","job_Engineer, maintenance","job_Engineer, manufacturing","job_Engineer, materials","job_Engineer, mining","job_Engineer, petroleum","job_Engineer, production","job_Engineer, site","job_Engineer, structural","job_Engineer, technical sales",job_Engineering geologist,job_English as a foreign language teacher,job_English as a second language teacher,job_Environmental consultant,job_Environmental education officer,job_Environmental health practitioner,job_Environmental manager,job_Equality and diversity officer,job_Equities trader,job_Estate manager/land agent,job_Event organiser,job_Exercise physiologist,job_Exhibition designer,"job_Exhibitions officer, museum/gallery",job_Facilities manager,job_Farm manager,job_Field seismologist,job_Field trials officer,job_Film/video editor,job_Financial adviser,job_Financial trader,job_Fine artist,job_Firefighter,job_Fisheries officer,job_Fitness centre manager,job_Forensic psychologist,job_Forest/woodland manager,job_Freight forwarder,job_Furniture conservator/restorer,job_Furniture designer,job_Further education lecturer,job_Futures trader,job_Gaffer,job_Garment/textile technologist,job_General practice doctor,"job_Geneticist, molecular",job_Geochemist,"job_Geologist, engineering","job_Geologist, wellsite",job_Geophysicist/field seismologist,job_Geoscientist,job_Glass blower/designer,job_Health and safety adviser,job_Health physicist,job_Health promotion specialist,job_Health service manager,job_Health visitor,job_Herbalist,job_Heritage manager,job_Herpetologist,job_Higher education careers adviser,job_Historic buildings inspector/conservation officer,job_Homeopath,job_Horticultural consultant,job_Horticultural therapist,"job_Horticulturist, commercial",job_Hospital doctor,job_Hospital pharmacist,job_Hotel manager,job_Human resources officer,job_Hydrogeologist,job_Hydrographic surveyor,job_Hydrologist,job_IT consultant,job_IT trainer,job_Illustrator,job_Immigration officer,job_Immunologist,job_Industrial buyer,job_Industrial/product designer,job_Information officer,job_Information systems manager,job_Insurance broker,job_Insurance claims handler,job_Insurance risk surveyor,job_Insurance underwriter,job_Intelligence analyst,job_Interior and spatial designer,job_Interpreter,job_Investment analyst,"job_Investment banker, corporate","job_Investment banker, operational",job_Jewellery designer,"job_Journalist, newspaper",job_Land,job_Land/geomatics surveyor,job_Landscape architect,job_Lawyer,job_Learning disability nurse,job_Learning mentor,"job_Lecturer, further education","job_Lecturer, higher education",job_Legal secretary,job_Leisure centre manager,job_Lexicographer,"job_Librarian, academic","job_Librarian, public",job_Licensed conveyancer,job_Local government officer,job_Location manager,job_Logistics and distribution manager,"job_Loss adjuster, chartered",job_Magazine features editor,job_Magazine journalist,job_Maintenance engineer,job_Make,job_Management consultant,job_Manufacturing engineer,job_Manufacturing systems engineer,job_Market researcher,job_Marketing executive,job_Materials engineer,job_Mechanical engineer,job_Media buyer,job_Media planner,job_Medical physicist,job_Medical sales representative,job_Medical secretary,job_Medical technical officer,job_Mental health nurse,"job_Merchandiser, retail",job_Metallurgist,job_Minerals surveyor,job_Mining engineer,job_Mudlogger,job_Multimedia programmer,job_Museum education officer,job_Museum/gallery conservator,job_Museum/gallery exhibitions officer,job_Music therapist,job_Music tutor,job_Musician,job_Nature conservation officer,job_Naval architect,job_Network engineer,job_Neurosurgeon,"job_Nurse, children's","job_Nurse, mental health",job_Nutritional therapist,job_Occupational hygienist,job_Occupational psychologist,job_Occupational therapist,job_Oceanographer,job_Oncologist,job_Operational researcher,job_Operations geologist,"job_Optician, dispensing",job_Optometrist,job_Orthoptist,job_Osteopath,job_Outdoor activities/education manager,job_Paediatric nurse,job_Paramedic,job_Patent attorney,job_Pathologist,job_Pension scheme manager,job_Pensions consultant,job_Personnel officer,job_Petroleum engineer,"job_Pharmacist, community","job_Pharmacist, hospital",job_Pharmacologist,"job_Physicist, medical",job_Physiological scientist,job_Physiotherapist,job_Phytotherapist,"job_Pilot, airline",job_Planning and development surveyor,job_Plant breeder/geneticist,job_Podiatrist,job_Police officer,job_Politician's assistant,"job_Presenter, broadcasting",job_Press photographer,job_Press sub,job_Primary school teacher,job_Prison officer,job_Private music teacher,job_Probation officer,"job_Producer, radio","job_Producer, television/film/video",job_Product designer,job_Product manager,job_Product/process development scientist,"job_Production assistant, radio","job_Production assistant, television",job_Production engineer,job_Production manager,job_Professor Emeritus,"job_Programme researcher, broadcasting/film/video","job_Programmer, applications","job_Programmer, multimedia",job_Psychiatric nurse,job_Psychiatrist,"job_Psychologist, clinical","job_Psychologist, counselling","job_Psychologist, forensic","job_Psychologist, sport and exercise",job_Psychotherapist,"job_Psychotherapist, child",job_Public affairs consultant,job_Public house manager,job_Public librarian,job_Public relations account executive,job_Public relations officer,job_Purchasing manager,job_Quantity surveyor,job_Quarry manager,job_Race relations officer,job_Radio broadcast assistant,job_Radio producer,"job_Radiographer, diagnostic","job_Radiographer, therapeutic",job_Records manager,job_Regulatory affairs officer,"job_Research officer, political party","job_Research officer, trade union",job_Research scientist (life sciences),job_Research scientist (maths),job_Research scientist (medical),job_Research scientist (physical sciences),"job_Restaurant manager, fast food",job_Retail banker,job_Retail buyer,job_Retail manager,job_Retail merchandiser,job_Risk analyst,job_Rural practice surveyor,job_Sales executive,"job_Sales professional, IT",job_Sales promotion account executive,job_Science writer,job_Scientific laboratory technician,"job_Scientist, audiological","job_Scientist, biomedical","job_Scientist, clinical (histocompatibility and immunogenetics)","job_Scientist, marine","job_Scientist, physiological","job_Scientist, research (maths)","job_Scientist, research (medical)","job_Scientist, research (physical sciences)",job_Secondary school teacher,job_Secretary/administrator,job_Seismic interpreter,job_Senior tax professional/tax inspector,job_Set designer,job_Ship broker,job_Site engineer,"job_Social research officer, government",job_Social researcher,job_Soil scientist,job_Solicitor,"job_Solicitor, Scotland",job_Special educational needs teacher,job_Special effects artist,job_Sport and exercise psychologist,job_Sports administrator,job_Sports development officer,job_Stage manager,job_Statistician,job_Structural engineer,job_Sub,job_Surgeon,"job_Surveyor, hydrographic","job_Surveyor, land/geomatics","job_Surveyor, minerals","job_Surveyor, mining","job_Surveyor, rural practice",job_Systems analyst,job_Systems developer,job_TEFL teacher,job_Tax adviser,job_Tax inspector,"job_Teacher, English as a foreign language","job_Teacher, adult education","job_Teacher, early years/pre","job_Teacher, primary school","job_Teacher, secondary school","job_Teacher, special educational needs",job_Teaching laboratory technician,job_Technical brewer,job_Telecommunications researcher,job_Television camera operator,job_Television floor manager,job_Television production assistant,job_Television/film/video producer,job_Textile designer,job_Theatre director,job_Theatre manager,job_Theme park manager,"job_Therapist, art","job_Therapist, drama","job_Therapist, horticultural","job_Therapist, music","job_Therapist, occupational","job_Therapist, sports",job_Tour manager,job_Tourism officer,job_Tourist information centre manager,job_Town planner,job_Toxicologist,job_Trade mark attorney,job_Trading standards officer,job_Training and development officer,job_Transport planner,job_Travel agency manager,job_Tree surgeon,job_Veterinary surgeon,job_Video editor,job_Visual merchandiser,job_Volunteer coordinator,job_Warden/ranger,job_Warehouse manager,job_Waste management officer,job_Water engineer,job_Water quality scientist,job_Web designer,job_Wellsite geologist,job_Writer,gender_M
0,250.77,928,42.94698,-88.583143,39,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1
1,61.08,205,40.134218,-88.075605,65,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
2,67.42,2457,30.418121,-95.410587,43,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1
3,8.06,1087,43.6287,-94.120707,61,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1
4,138.38,3994,37.008141,-81.411206,88,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0


# Aplicar transformações aos dados

In [37]:
if TIPO_DE_TRANSFORMACAO == 'standardization':
    scaler = StandardScaler()
elif TIPO_DE_TRANSFORMACAO == 'min_max':
    scaler = MinMaxScaler()
else:
    scaler = RobustScaler()

In [38]:
remove_columns = list(categorical_columns.columns)

data_train = scaler.fit_transform(X_train.drop(remove_columns, axis=1))
X_train_transformed = pd.DataFrame(data=data_train, columns=X_train.drop(remove_columns, axis=1).columns)
X_train_transformed = pd.concat([X_train_transformed, X_train[remove_columns]], axis=1)

data_test = scaler.transform(X_test.drop(remove_columns, axis=1))
X_test_transformed = pd.DataFrame(data=data_test, columns=X_test.drop(remove_columns, axis=1).columns)
X_test_transformed = pd.concat([X_test_transformed, X_test[remove_columns]], axis=1)

In [39]:
X_train_transformed.head()

Unnamed: 0,amt,city_pop,merch_lat,merch_long,age,category_food_dining,category_gas_transport,category_grocery_net,category_grocery_pos,category_health_fitness,category_home,category_kids_pets,category_misc_net,category_misc_pos,category_personal_care,category_shopping_net,category_shopping_pos,category_travel,"job_Accountant, chartered","job_Accountant, chartered certified","job_Accountant, chartered public finance",job_Accounting technician,job_Acupuncturist,job_Administrator,"job_Administrator, arts","job_Administrator, charities/voluntary organisations","job_Administrator, education","job_Administrator, local government",job_Advertising account executive,job_Advertising account planner,job_Advertising copywriter,job_Advice worker,job_Aeronautical engineer,job_Agricultural consultant,job_Aid worker,job_Air broker,job_Air cabin crew,job_Air traffic controller,job_Airline pilot,job_Ambulance person,job_Amenity horticulturist,job_Analytical chemist,job_Animal nutritionist,job_Animal technologist,job_Animator,job_Applications developer,job_Arboriculturist,job_Archaeologist,job_Architect,job_Architectural technologist,job_Archivist,job_Armed forces logistics/support/administrative officer,job_Armed forces technical officer,job_Armed forces training and education officer,job_Art gallery manager,job_Art therapist,job_Artist,job_Arts development officer,job_Associate Professor,job_Audiological scientist,job_Barista,job_Barrister,job_Barrister's clerk,"job_Biochemist, clinical",job_Biomedical engineer,job_Biomedical scientist,job_Bookseller,job_Broadcast engineer,job_Broadcast journalist,job_Broadcast presenter,job_Building control surveyor,job_Building services engineer,job_Building surveyor,"job_Buyer, industrial","job_Buyer, retail",job_Cabin crew,job_Call centre manager,job_Camera operator,job_Careers adviser,job_Careers information officer,job_Cartographer,job_Catering manager,job_Ceramics designer,job_Charity fundraiser,job_Charity officer,job_Chartered accountant,job_Chartered legal executive (England and Wales),job_Chartered loss adjuster,job_Chartered public finance accountant,job_Chemical engineer,"job_Chemist, analytical",job_Chief Executive Officer,job_Chief Financial Officer,job_Chief Marketing Officer,job_Chief Operating Officer,job_Chief Strategy Officer,job_Chief Technology Officer,job_Chief of Staff,job_Child psychotherapist,job_Chiropodist,job_Civil Service administrator,job_Civil Service fast streamer,"job_Civil engineer, contracting",job_Claims inspector/assessor,job_Clinical biochemist,job_Clinical cytogeneticist,job_Clinical psychologist,job_Clinical research associate,job_Clothing/textile technologist,job_Colour technologist,job_Commercial horticulturist,job_Commercial/residential surveyor,job_Commissioning editor,job_Communications engineer,job_Community arts worker,job_Community development worker,job_Community education officer,job_Community pharmacist,job_Company secretary,job_Comptroller,"job_Conservation officer, historic buildings","job_Conservator, furniture","job_Conservator, museum/gallery",job_Contracting civil engineer,job_Contractor,job_Control and instrumentation engineer,job_Copy,"job_Copywriter, advertising",job_Corporate investment banker,job_Counselling psychologist,job_Counsellor,job_Curator,job_Cytogeneticist,job_Dance movement psychotherapist,job_Dancer,job_Data scientist,job_Database administrator,job_Dealer,"job_Designer, ceramics/pottery","job_Designer, exhibition/display","job_Designer, furniture","job_Designer, industrial/product","job_Designer, interior/spatial","job_Designer, jewellery","job_Designer, multimedia","job_Designer, television/film set","job_Designer, textile","job_Development worker, community","job_Development worker, international aid",job_Diagnostic radiographer,job_Dispensing optician,"job_Doctor, general practice","job_Doctor, hospital",job_Drilling engineer,job_Early years teacher,job_Ecologist,job_Economist,"job_Editor, commissioning","job_Editor, film/video","job_Editor, magazine features",job_Education administrator,"job_Education officer, community","job_Education officer, museum",job_Educational psychologist,job_Electrical engineer,job_Electronics engineer,"job_Embryologist, clinical",job_Emergency planning/management officer,job_Energy engineer,job_Energy manager,"job_Engineer, aeronautical","job_Engineer, agricultural","job_Engineer, automotive","job_Engineer, biomedical","job_Engineer, broadcasting (operations)","job_Engineer, building services","job_Engineer, civil (consulting)","job_Engineer, civil (contracting)","job_Engineer, communications","job_Engineer, control and instrumentation","job_Engineer, drilling","job_Engineer, electronics","job_Engineer, land","job_Engineer, maintenance","job_Engineer, manufacturing","job_Engineer, materials","job_Engineer, mining","job_Engineer, petroleum","job_Engineer, production","job_Engineer, site","job_Engineer, structural","job_Engineer, technical sales",job_Engineering geologist,job_English as a foreign language teacher,job_English as a second language teacher,job_Environmental consultant,job_Environmental education officer,job_Environmental health practitioner,job_Environmental manager,job_Equality and diversity officer,job_Equities trader,job_Estate manager/land agent,job_Event organiser,job_Exercise physiologist,job_Exhibition designer,"job_Exhibitions officer, museum/gallery",job_Facilities manager,job_Farm manager,job_Field seismologist,job_Field trials officer,job_Film/video editor,job_Financial adviser,job_Financial trader,job_Fine artist,job_Firefighter,job_Fisheries officer,job_Fitness centre manager,job_Forensic psychologist,job_Forest/woodland manager,job_Freight forwarder,job_Furniture conservator/restorer,job_Furniture designer,job_Further education lecturer,job_Futures trader,job_Gaffer,job_Garment/textile technologist,job_General practice doctor,"job_Geneticist, molecular",job_Geochemist,"job_Geologist, engineering","job_Geologist, wellsite",job_Geophysicist/field seismologist,job_Geoscientist,job_Glass blower/designer,job_Health and safety adviser,job_Health physicist,job_Health promotion specialist,job_Health service manager,job_Health visitor,job_Herbalist,job_Heritage manager,job_Herpetologist,job_Higher education careers adviser,job_Historic buildings inspector/conservation officer,job_Homeopath,job_Horticultural consultant,job_Horticultural therapist,"job_Horticulturist, commercial",job_Hospital doctor,job_Hospital pharmacist,job_Hotel manager,job_Human resources officer,job_Hydrogeologist,job_Hydrographic surveyor,job_Hydrologist,job_IT consultant,job_IT trainer,job_Illustrator,job_Immigration officer,job_Immunologist,job_Industrial buyer,job_Industrial/product designer,job_Information officer,job_Information systems manager,job_Insurance broker,job_Insurance claims handler,job_Insurance risk surveyor,job_Insurance underwriter,job_Intelligence analyst,job_Interior and spatial designer,job_Interpreter,job_Investment analyst,"job_Investment banker, corporate","job_Investment banker, operational",job_Jewellery designer,"job_Journalist, newspaper",job_Land,job_Land/geomatics surveyor,job_Landscape architect,job_Lawyer,job_Learning disability nurse,job_Learning mentor,"job_Lecturer, further education","job_Lecturer, higher education",job_Legal secretary,job_Leisure centre manager,job_Lexicographer,"job_Librarian, academic","job_Librarian, public",job_Licensed conveyancer,job_Local government officer,job_Location manager,job_Logistics and distribution manager,"job_Loss adjuster, chartered",job_Magazine features editor,job_Magazine journalist,job_Maintenance engineer,job_Make,job_Management consultant,job_Manufacturing engineer,job_Manufacturing systems engineer,job_Market researcher,job_Marketing executive,job_Materials engineer,job_Mechanical engineer,job_Media buyer,job_Media planner,job_Medical physicist,job_Medical sales representative,job_Medical secretary,job_Medical technical officer,job_Mental health nurse,"job_Merchandiser, retail",job_Metallurgist,job_Minerals surveyor,job_Mining engineer,job_Mudlogger,job_Multimedia programmer,job_Museum education officer,job_Museum/gallery conservator,job_Museum/gallery exhibitions officer,job_Music therapist,job_Music tutor,job_Musician,job_Nature conservation officer,job_Naval architect,job_Network engineer,job_Neurosurgeon,"job_Nurse, children's","job_Nurse, mental health",job_Nutritional therapist,job_Occupational hygienist,job_Occupational psychologist,job_Occupational therapist,job_Oceanographer,job_Oncologist,job_Operational researcher,job_Operations geologist,"job_Optician, dispensing",job_Optometrist,job_Orthoptist,job_Osteopath,job_Outdoor activities/education manager,job_Paediatric nurse,job_Paramedic,job_Patent attorney,job_Pathologist,job_Pension scheme manager,job_Pensions consultant,job_Personnel officer,job_Petroleum engineer,"job_Pharmacist, community","job_Pharmacist, hospital",job_Pharmacologist,"job_Physicist, medical",job_Physiological scientist,job_Physiotherapist,job_Phytotherapist,"job_Pilot, airline",job_Planning and development surveyor,job_Plant breeder/geneticist,job_Podiatrist,job_Police officer,job_Politician's assistant,"job_Presenter, broadcasting",job_Press photographer,job_Press sub,job_Primary school teacher,job_Prison officer,job_Private music teacher,job_Probation officer,"job_Producer, radio","job_Producer, television/film/video",job_Product designer,job_Product manager,job_Product/process development scientist,"job_Production assistant, radio","job_Production assistant, television",job_Production engineer,job_Production manager,job_Professor Emeritus,"job_Programme researcher, broadcasting/film/video","job_Programmer, applications","job_Programmer, multimedia",job_Psychiatric nurse,job_Psychiatrist,"job_Psychologist, clinical","job_Psychologist, counselling","job_Psychologist, forensic","job_Psychologist, sport and exercise",job_Psychotherapist,"job_Psychotherapist, child",job_Public affairs consultant,job_Public house manager,job_Public librarian,job_Public relations account executive,job_Public relations officer,job_Purchasing manager,job_Quantity surveyor,job_Quarry manager,job_Race relations officer,job_Radio broadcast assistant,job_Radio producer,"job_Radiographer, diagnostic","job_Radiographer, therapeutic",job_Records manager,job_Regulatory affairs officer,"job_Research officer, political party","job_Research officer, trade union",job_Research scientist (life sciences),job_Research scientist (maths),job_Research scientist (medical),job_Research scientist (physical sciences),"job_Restaurant manager, fast food",job_Retail banker,job_Retail buyer,job_Retail manager,job_Retail merchandiser,job_Risk analyst,job_Rural practice surveyor,job_Sales executive,"job_Sales professional, IT",job_Sales promotion account executive,job_Science writer,job_Scientific laboratory technician,"job_Scientist, audiological","job_Scientist, biomedical","job_Scientist, clinical (histocompatibility and immunogenetics)","job_Scientist, marine","job_Scientist, physiological","job_Scientist, research (maths)","job_Scientist, research (medical)","job_Scientist, research (physical sciences)",job_Secondary school teacher,job_Secretary/administrator,job_Seismic interpreter,job_Senior tax professional/tax inspector,job_Set designer,job_Ship broker,job_Site engineer,"job_Social research officer, government",job_Social researcher,job_Soil scientist,job_Solicitor,"job_Solicitor, Scotland",job_Special educational needs teacher,job_Special effects artist,job_Sport and exercise psychologist,job_Sports administrator,job_Sports development officer,job_Stage manager,job_Statistician,job_Structural engineer,job_Sub,job_Surgeon,"job_Surveyor, hydrographic","job_Surveyor, land/geomatics","job_Surveyor, minerals","job_Surveyor, mining","job_Surveyor, rural practice",job_Systems analyst,job_Systems developer,job_TEFL teacher,job_Tax adviser,job_Tax inspector,"job_Teacher, English as a foreign language","job_Teacher, adult education","job_Teacher, early years/pre","job_Teacher, primary school","job_Teacher, secondary school","job_Teacher, special educational needs",job_Teaching laboratory technician,job_Technical brewer,job_Telecommunications researcher,job_Television camera operator,job_Television floor manager,job_Television production assistant,job_Television/film/video producer,job_Textile designer,job_Theatre director,job_Theatre manager,job_Theme park manager,"job_Therapist, art","job_Therapist, drama","job_Therapist, horticultural","job_Therapist, music","job_Therapist, occupational","job_Therapist, sports",job_Tour manager,job_Tourism officer,job_Tourist information centre manager,job_Town planner,job_Toxicologist,job_Trade mark attorney,job_Trading standards officer,job_Training and development officer,job_Transport planner,job_Travel agency manager,job_Tree surgeon,job_Veterinary surgeon,job_Video editor,job_Visual merchandiser,job_Volunteer coordinator,job_Warden/ranger,job_Warehouse manager,job_Waste management officer,job_Water engineer,job_Water quality scientist,job_Web designer,job_Wellsite geologist,job_Writer,gender_M
0,-0.6657,-0.296709,1.112394,0.324619,-1.305541,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
1,-0.62944,-0.294265,0.977763,-0.184545,0.467249,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1
2,1.734776,-0.240022,1.33987,-1.964553,0.578048,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
3,-0.766013,-0.296217,1.771822,-0.347052,0.30105,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
4,1.750456,-0.295461,0.407062,1.092094,-0.862343,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1


In [40]:
X_test_transformed.head()

Unnamed: 0,amt,city_pop,merch_lat,merch_long,age,category_food_dining,category_gas_transport,category_grocery_net,category_grocery_pos,category_health_fitness,category_home,category_kids_pets,category_misc_net,category_misc_pos,category_personal_care,category_shopping_net,category_shopping_pos,category_travel,"job_Accountant, chartered","job_Accountant, chartered certified","job_Accountant, chartered public finance",job_Accounting technician,job_Acupuncturist,job_Administrator,"job_Administrator, arts","job_Administrator, charities/voluntary organisations","job_Administrator, education","job_Administrator, local government",job_Advertising account executive,job_Advertising account planner,job_Advertising copywriter,job_Advice worker,job_Aeronautical engineer,job_Agricultural consultant,job_Aid worker,job_Air broker,job_Air cabin crew,job_Air traffic controller,job_Airline pilot,job_Ambulance person,job_Amenity horticulturist,job_Analytical chemist,job_Animal nutritionist,job_Animal technologist,job_Animator,job_Applications developer,job_Arboriculturist,job_Archaeologist,job_Architect,job_Architectural technologist,job_Archivist,job_Armed forces logistics/support/administrative officer,job_Armed forces technical officer,job_Armed forces training and education officer,job_Art gallery manager,job_Art therapist,job_Artist,job_Arts development officer,job_Associate Professor,job_Audiological scientist,job_Barista,job_Barrister,job_Barrister's clerk,"job_Biochemist, clinical",job_Biomedical engineer,job_Biomedical scientist,job_Bookseller,job_Broadcast engineer,job_Broadcast journalist,job_Broadcast presenter,job_Building control surveyor,job_Building services engineer,job_Building surveyor,"job_Buyer, industrial","job_Buyer, retail",job_Cabin crew,job_Call centre manager,job_Camera operator,job_Careers adviser,job_Careers information officer,job_Cartographer,job_Catering manager,job_Ceramics designer,job_Charity fundraiser,job_Charity officer,job_Chartered accountant,job_Chartered legal executive (England and Wales),job_Chartered loss adjuster,job_Chartered public finance accountant,job_Chemical engineer,"job_Chemist, analytical",job_Chief Executive Officer,job_Chief Financial Officer,job_Chief Marketing Officer,job_Chief Operating Officer,job_Chief Strategy Officer,job_Chief Technology Officer,job_Chief of Staff,job_Child psychotherapist,job_Chiropodist,job_Civil Service administrator,job_Civil Service fast streamer,"job_Civil engineer, contracting",job_Claims inspector/assessor,job_Clinical biochemist,job_Clinical cytogeneticist,job_Clinical psychologist,job_Clinical research associate,job_Clothing/textile technologist,job_Colour technologist,job_Commercial horticulturist,job_Commercial/residential surveyor,job_Commissioning editor,job_Communications engineer,job_Community arts worker,job_Community development worker,job_Community education officer,job_Community pharmacist,job_Company secretary,job_Comptroller,"job_Conservation officer, historic buildings","job_Conservator, furniture","job_Conservator, museum/gallery",job_Contracting civil engineer,job_Contractor,job_Control and instrumentation engineer,job_Copy,"job_Copywriter, advertising",job_Corporate investment banker,job_Counselling psychologist,job_Counsellor,job_Curator,job_Cytogeneticist,job_Dance movement psychotherapist,job_Dancer,job_Data scientist,job_Database administrator,job_Dealer,"job_Designer, ceramics/pottery","job_Designer, exhibition/display","job_Designer, furniture","job_Designer, industrial/product","job_Designer, interior/spatial","job_Designer, jewellery","job_Designer, multimedia","job_Designer, television/film set","job_Designer, textile","job_Development worker, community","job_Development worker, international aid",job_Diagnostic radiographer,job_Dispensing optician,"job_Doctor, general practice","job_Doctor, hospital",job_Drilling engineer,job_Early years teacher,job_Ecologist,job_Economist,"job_Editor, commissioning","job_Editor, film/video","job_Editor, magazine features",job_Education administrator,"job_Education officer, community","job_Education officer, museum",job_Educational psychologist,job_Electrical engineer,job_Electronics engineer,"job_Embryologist, clinical",job_Emergency planning/management officer,job_Energy engineer,job_Energy manager,"job_Engineer, aeronautical","job_Engineer, agricultural","job_Engineer, automotive","job_Engineer, biomedical","job_Engineer, broadcasting (operations)","job_Engineer, building services","job_Engineer, civil (consulting)","job_Engineer, civil (contracting)","job_Engineer, communications","job_Engineer, control and instrumentation","job_Engineer, drilling","job_Engineer, electronics","job_Engineer, land","job_Engineer, maintenance","job_Engineer, manufacturing","job_Engineer, materials","job_Engineer, mining","job_Engineer, petroleum","job_Engineer, production","job_Engineer, site","job_Engineer, structural","job_Engineer, technical sales",job_Engineering geologist,job_English as a foreign language teacher,job_English as a second language teacher,job_Environmental consultant,job_Environmental education officer,job_Environmental health practitioner,job_Environmental manager,job_Equality and diversity officer,job_Equities trader,job_Estate manager/land agent,job_Event organiser,job_Exercise physiologist,job_Exhibition designer,"job_Exhibitions officer, museum/gallery",job_Facilities manager,job_Farm manager,job_Field seismologist,job_Field trials officer,job_Film/video editor,job_Financial adviser,job_Financial trader,job_Fine artist,job_Firefighter,job_Fisheries officer,job_Fitness centre manager,job_Forensic psychologist,job_Forest/woodland manager,job_Freight forwarder,job_Furniture conservator/restorer,job_Furniture designer,job_Further education lecturer,job_Futures trader,job_Gaffer,job_Garment/textile technologist,job_General practice doctor,"job_Geneticist, molecular",job_Geochemist,"job_Geologist, engineering","job_Geologist, wellsite",job_Geophysicist/field seismologist,job_Geoscientist,job_Glass blower/designer,job_Health and safety adviser,job_Health physicist,job_Health promotion specialist,job_Health service manager,job_Health visitor,job_Herbalist,job_Heritage manager,job_Herpetologist,job_Higher education careers adviser,job_Historic buildings inspector/conservation officer,job_Homeopath,job_Horticultural consultant,job_Horticultural therapist,"job_Horticulturist, commercial",job_Hospital doctor,job_Hospital pharmacist,job_Hotel manager,job_Human resources officer,job_Hydrogeologist,job_Hydrographic surveyor,job_Hydrologist,job_IT consultant,job_IT trainer,job_Illustrator,job_Immigration officer,job_Immunologist,job_Industrial buyer,job_Industrial/product designer,job_Information officer,job_Information systems manager,job_Insurance broker,job_Insurance claims handler,job_Insurance risk surveyor,job_Insurance underwriter,job_Intelligence analyst,job_Interior and spatial designer,job_Interpreter,job_Investment analyst,"job_Investment banker, corporate","job_Investment banker, operational",job_Jewellery designer,"job_Journalist, newspaper",job_Land,job_Land/geomatics surveyor,job_Landscape architect,job_Lawyer,job_Learning disability nurse,job_Learning mentor,"job_Lecturer, further education","job_Lecturer, higher education",job_Legal secretary,job_Leisure centre manager,job_Lexicographer,"job_Librarian, academic","job_Librarian, public",job_Licensed conveyancer,job_Local government officer,job_Location manager,job_Logistics and distribution manager,"job_Loss adjuster, chartered",job_Magazine features editor,job_Magazine journalist,job_Maintenance engineer,job_Make,job_Management consultant,job_Manufacturing engineer,job_Manufacturing systems engineer,job_Market researcher,job_Marketing executive,job_Materials engineer,job_Mechanical engineer,job_Media buyer,job_Media planner,job_Medical physicist,job_Medical sales representative,job_Medical secretary,job_Medical technical officer,job_Mental health nurse,"job_Merchandiser, retail",job_Metallurgist,job_Minerals surveyor,job_Mining engineer,job_Mudlogger,job_Multimedia programmer,job_Museum education officer,job_Museum/gallery conservator,job_Museum/gallery exhibitions officer,job_Music therapist,job_Music tutor,job_Musician,job_Nature conservation officer,job_Naval architect,job_Network engineer,job_Neurosurgeon,"job_Nurse, children's","job_Nurse, mental health",job_Nutritional therapist,job_Occupational hygienist,job_Occupational psychologist,job_Occupational therapist,job_Oceanographer,job_Oncologist,job_Operational researcher,job_Operations geologist,"job_Optician, dispensing",job_Optometrist,job_Orthoptist,job_Osteopath,job_Outdoor activities/education manager,job_Paediatric nurse,job_Paramedic,job_Patent attorney,job_Pathologist,job_Pension scheme manager,job_Pensions consultant,job_Personnel officer,job_Petroleum engineer,"job_Pharmacist, community","job_Pharmacist, hospital",job_Pharmacologist,"job_Physicist, medical",job_Physiological scientist,job_Physiotherapist,job_Phytotherapist,"job_Pilot, airline",job_Planning and development surveyor,job_Plant breeder/geneticist,job_Podiatrist,job_Police officer,job_Politician's assistant,"job_Presenter, broadcasting",job_Press photographer,job_Press sub,job_Primary school teacher,job_Prison officer,job_Private music teacher,job_Probation officer,"job_Producer, radio","job_Producer, television/film/video",job_Product designer,job_Product manager,job_Product/process development scientist,"job_Production assistant, radio","job_Production assistant, television",job_Production engineer,job_Production manager,job_Professor Emeritus,"job_Programme researcher, broadcasting/film/video","job_Programmer, applications","job_Programmer, multimedia",job_Psychiatric nurse,job_Psychiatrist,"job_Psychologist, clinical","job_Psychologist, counselling","job_Psychologist, forensic","job_Psychologist, sport and exercise",job_Psychotherapist,"job_Psychotherapist, child",job_Public affairs consultant,job_Public house manager,job_Public librarian,job_Public relations account executive,job_Public relations officer,job_Purchasing manager,job_Quantity surveyor,job_Quarry manager,job_Race relations officer,job_Radio broadcast assistant,job_Radio producer,"job_Radiographer, diagnostic","job_Radiographer, therapeutic",job_Records manager,job_Regulatory affairs officer,"job_Research officer, political party","job_Research officer, trade union",job_Research scientist (life sciences),job_Research scientist (maths),job_Research scientist (medical),job_Research scientist (physical sciences),"job_Restaurant manager, fast food",job_Retail banker,job_Retail buyer,job_Retail manager,job_Retail merchandiser,job_Risk analyst,job_Rural practice surveyor,job_Sales executive,"job_Sales professional, IT",job_Sales promotion account executive,job_Science writer,job_Scientific laboratory technician,"job_Scientist, audiological","job_Scientist, biomedical","job_Scientist, clinical (histocompatibility and immunogenetics)","job_Scientist, marine","job_Scientist, physiological","job_Scientist, research (maths)","job_Scientist, research (medical)","job_Scientist, research (physical sciences)",job_Secondary school teacher,job_Secretary/administrator,job_Seismic interpreter,job_Senior tax professional/tax inspector,job_Set designer,job_Ship broker,job_Site engineer,"job_Social research officer, government",job_Social researcher,job_Soil scientist,job_Solicitor,"job_Solicitor, Scotland",job_Special educational needs teacher,job_Special effects artist,job_Sport and exercise psychologist,job_Sports administrator,job_Sports development officer,job_Stage manager,job_Statistician,job_Structural engineer,job_Sub,job_Surgeon,"job_Surveyor, hydrographic","job_Surveyor, land/geomatics","job_Surveyor, minerals","job_Surveyor, mining","job_Surveyor, rural practice",job_Systems analyst,job_Systems developer,job_TEFL teacher,job_Tax adviser,job_Tax inspector,"job_Teacher, English as a foreign language","job_Teacher, adult education","job_Teacher, early years/pre","job_Teacher, primary school","job_Teacher, secondary school","job_Teacher, special educational needs",job_Teaching laboratory technician,job_Technical brewer,job_Telecommunications researcher,job_Television camera operator,job_Television floor manager,job_Television production assistant,job_Television/film/video producer,job_Textile designer,job_Theatre director,job_Theatre manager,job_Theme park manager,"job_Therapist, art","job_Therapist, drama","job_Therapist, horticultural","job_Therapist, music","job_Therapist, occupational","job_Therapist, sports",job_Tour manager,job_Tourism officer,job_Tourist information centre manager,job_Town planner,job_Toxicologist,job_Trade mark attorney,job_Trading standards officer,job_Training and development officer,job_Transport planner,job_Travel agency manager,job_Tree surgeon,job_Veterinary surgeon,job_Video editor,job_Visual merchandiser,job_Volunteer coordinator,job_Warden/ranger,job_Warehouse manager,job_Waste management officer,job_Water engineer,job_Water quality scientist,job_Web designer,job_Wellsite geologist,job_Writer,gender_M
0,-0.128199,-0.294808,0.837537,0.114872,-0.751544,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1
1,-0.644575,-0.29728,0.29339,0.150394,0.688848,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
2,-0.627316,-0.289582,-1.586253,-0.362977,-0.529945,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1
3,-0.788907,-0.294265,0.96942,-0.272699,0.467249,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1
4,-0.434148,-0.284328,-0.31137,0.616831,1.96304,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0


In [41]:
print(f'X treino shape: {X_train_transformed.shape}')
print(f'X teste shape: {X_test_transformed.shape}')

X treino shape: (10508, 512)
X teste shape: (4504, 512)


In [42]:
def create_neural_network_model(shape: tuple[int, ...]) -> tf.keras.models.Sequential:
    
    model = tf.keras.models.Sequential(name='NeuralNetwork')

    model.add(tf.keras.Input(shape=shape, name='Input'))
    model.add(tf.keras.layers.Dense(units=64, kernel_initializer='random_uniform', activation='relu', name='Dense_1'))
    model.add(tf.keras.layers.Dense(units=32, kernel_initializer='random_uniform', activation='relu', name='Dense_2'))
    model.add(tf.keras.layers.Dense(units=1, kernel_initializer='random_uniform', activation='sigmoid', name='Dense_3'))

    model.compile(loss='binary_crossentropy', optimizer=tf.keras.optimizers.Adam(learning_rate=0.001), metrics=['accuracy'])

    return model

In [43]:
nn = create_neural_network_model(shape=(X_train_transformed.shape[1], ))

2024-08-20 15:37:09.370806: I metal_plugin/src/device/metal_device.cc:1154] Metal device set to: Apple M3 Pro
2024-08-20 15:37:09.370825: I metal_plugin/src/device/metal_device.cc:296] systemMemory: 18.00 GB
2024-08-20 15:37:09.370831: I metal_plugin/src/device/metal_device.cc:313] maxCacheSize: 6.00 GB
2024-08-20 15:37:09.370857: I tensorflow/core/common_runtime/pluggable_device/pluggable_device_factory.cc:306] Could not identify NUMA node of platform GPU ID 0, defaulting to 0. Your kernel may not have been built with NUMA support.
2024-08-20 15:37:09.370870: I tensorflow/core/common_runtime/pluggable_device/pluggable_device_factory.cc:272] Created TensorFlow device (/job:localhost/replica:0/task:0/device:GPU:0 with 0 MB memory) -> physical PluggableDevice (device: 0, name: METAL, pci bus id: <undefined>)


In [44]:
es = tf.keras.callbacks.EarlyStopping(monitor='loss', min_delta=1e-10, patience=5, verbose=1)
rlr = tf.keras.callbacks.ReduceLROnPlateau(monitor='loss', factor=0.2, patience=5, verbose=1)
nn.fit(X_train_transformed, y_train, epochs=100, callbacks=[es, rlr])

Epoch 1/100
  1/329 [..............................] - ETA: 1:50 - loss: 0.6930 - accuracy: 0.5938

2024-08-20 15:37:09.734099: I tensorflow/core/grappler/optimizers/custom_graph_optimizer_registry.cc:117] Plugin optimizer for device_type GPU is enabled.
2024-08-20 15:37:09.756703: E tensorflow/core/grappler/optimizers/meta_optimizer.cc:961] model_pruner failed: INVALID_ARGUMENT: Graph does not contain terminal node Adam/AssignAddVariableOp.


Epoch 2/100
Epoch 3/100
Epoch 4/100
Epoch 5/100
Epoch 6/100
Epoch 7/100
Epoch 8/100
Epoch 9/100
Epoch 9: ReduceLROnPlateau reducing learning rate to 0.00020000000949949026.
Epoch 9: early stopping


<keras.src.callbacks.History at 0x3a2a25ca0>

In [45]:
y_pred_test = nn.predict(X_test_transformed)



In [46]:
y_pred_test

array([[0.60656077],
       [0.44751185],
       [0.38648838],
       ...,
       [0.9366388 ],
       [0.15464488],
       [0.47072852]], dtype=float32)

In [47]:
y_pred_test_2 = y_pred_test > 0.5

In [48]:
accuracy_score(y_test, y_pred_test_2)

0.8376998223801065

# Treinar os modelos de machine learning

In [49]:
models_list = [LogisticRegression(random_state=0), RandomForestClassifier(), DecisionTreeClassifier(), KNeighborsClassifier(),
               create_neural_network_model(shape=(X_train_transformed.shape[1], ))]

df_results = pd.DataFrame(columns=['Model', 'accuracy train', 'accuracy test', 'precision train', 'precision test', 'recall train', 'recall test', 'f1 train', 'f1 test'])

results_index = 0

for model in tqdm(models_list):

    model_name = type(model).__name__
    os.makedirs(f'./Results/{model_name}/', exist_ok=True)
    
    if model_name == 'Sequential':
        es = tf.keras.callbacks.EarlyStopping(monitor='loss', min_delta=1e-10, patience=5, verbose=1)
        rlr = tf.keras.callbacks.ReduceLROnPlateau(monitor='loss', factor=0.2, patience=5, verbose=1)
        model.fit(X_train_transformed, y_train, epochs=100, callbacks=[es, rlr])
    else:
        model.fit(X_train_transformed, y_train)
    y_pred_train = model.predict(X_train_transformed)
    y_pred_test = model.predict(X_test_transformed)
    
    if model_name == 'Sequential':
        y_pred_train = y_pred_train > 0.5
        y_pred_test = y_pred_test > 0.5
    
    classes_on_target = y_train.unique()
    cm = confusion_matrix(y_test, y_pred_test, labels=classes_on_target)

    display_cm = ConfusionMatrixDisplay(confusion_matrix=cm, display_labels=classes_on_target)
    plt.figure(figsize=(16, 10))
    display_cm.plot()
    plt.savefig(f'./Results/{model_name}/ConfusionMatrix.png')
    plt.close()

    fpr, tpr, thresholds = roc_curve(y_test, y_pred_test)
    roc_auc = auc(fpr, tpr)
    display_roc = RocCurveDisplay(fpr=fpr, tpr=tpr, roc_auc=roc_auc, estimator_name=f'{model_name}')
    plt.figure(figsize=(16, 10))
    display_roc.plot()
    plt.savefig(f'./Results/{model_name}/ROC.png')
    plt.close()
    
    accuracy_train = accuracy_score(y_train, y_pred_train)
    precision_train = precision_score(y_train, y_pred_train)
    recall_train = recall_score(y_train, y_pred_train)
    f1_train = f1_score(y_train, y_pred_train)

    accuracy_test = accuracy_score(y_test, y_pred_test)
    precision_test = precision_score(y_test, y_pred_test)
    recall_test = recall_score(y_test, y_pred_test)
    f1_test = f1_score(y_test, y_pred_test)

    df_results.loc[results_index, 'Model'] = model_name
    df_results.loc[results_index, 'accuracy train'] = np.round(accuracy_train,4)
    df_results.loc[results_index, 'accuracy test'] = np.round(accuracy_test,4)
    df_results.loc[results_index, 'precision train'] = np.round(precision_train,4)
    df_results.loc[results_index, 'precision test'] = np.round(precision_test,4)
    df_results.loc[results_index, 'recall train'] = np.round(recall_train,4)
    df_results.loc[results_index, 'recall test'] = np.round(recall_test,4)
    df_results.loc[results_index, 'f1 train'] = np.round(f1_train,4)
    df_results.loc[results_index, 'f1 test'] = np.round(f1_test,4)
    
    results_index += 1

df_results.sort_values(by='accuracy test', ascending=False, inplace=True)
df_results.to_excel('./Results/all_results.xlsx', engine='openpyxl', index=False)

 80%|████████  | 4/5 [00:04<00:01,  1.13s/it]

Epoch 1/100
Epoch 2/100
Epoch 3/100
Epoch 4/100
Epoch 5/100
Epoch 6/100
Epoch 7/100
Epoch 8/100
Epoch 9/100
Epoch 10/100
Epoch 11/100
Epoch 12/100
Epoch 13/100
Epoch 14/100
Epoch 14: ReduceLROnPlateau reducing learning rate to 0.00020000000949949026.
Epoch 14: early stopping


100%|██████████| 5/5 [00:24<00:00,  4.90s/it]


<Figure size 1600x1000 with 0 Axes>

<Figure size 1600x1000 with 0 Axes>

<Figure size 1600x1000 with 0 Axes>

<Figure size 1600x1000 with 0 Axes>

<Figure size 1600x1000 with 0 Axes>

<Figure size 1600x1000 with 0 Axes>

<Figure size 1600x1000 with 0 Axes>

<Figure size 1600x1000 with 0 Axes>

<Figure size 1600x1000 with 0 Axes>

<Figure size 1600x1000 with 0 Axes>

In [50]:
df_results

Unnamed: 0,Model,accuracy train,accuracy test,precision train,precision test,recall train,recall test,f1 train,f1 test
2,DecisionTreeClassifier,1.0,0.9552,1.0,0.9488,1.0,0.9623,1.0,0.9555
1,RandomForestClassifier,1.0,0.9498,1.0,0.9647,1.0,0.9338,1.0,0.949
0,LogisticRegression,0.8494,0.837,0.8957,0.8799,0.7908,0.7806,0.84,0.8273
3,KNeighborsClassifier,0.8831,0.8337,0.9256,0.8767,0.8333,0.7766,0.877,0.8236
4,Sequential,0.822,0.8257,0.8653,0.8695,0.7628,0.7664,0.8108,0.8147
