# Phase 4 - Get Dummies

## Columns:

**Categorical Columns**  
- make_model
- body_type
- vat
- registration_year
- type
- inspection_new
- body_color
- paint_type
- upholstery_material
- gearing_type
- fuel
- emission_class
- drive_chain
- entertainment_media
- safety_security
- comfort_convenience
- extras
 
**Quantitative Columns**
- price
- km
- co2_emission
- consumption_combined
- consumption_country
- consumption_city
- hp
- displacement
- warranty
- previous_owners
- weight
- nr_of_doors
- nr_of_seats
- cylinders
- gears


---

In [141]:
import matplotlib.pyplot as plt
%matplotlib inline
import numpy as np
import pandas as pd
from scipy import stats
import seaborn as sns
import warnings;
warnings.filterwarnings("ignore")
import re
pd.set_option("display.max_columns",None)

In [142]:
# Load the input CSV; `auto` keeps the frame as read, while the cells below work from the copy `df`.
auto = pd.read_csv("car_data_3_no_outliers.csv")
df = auto.copy()

In [143]:
# Show column names, non-null counts and dtypes of the loaded frame.
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 15915 entries, 0 to 15914
Data columns (total 32 columns):
 #   Column                Non-Null Count  Dtype  
---  ------                --------------  -----  
 0   make_model            15915 non-null  object 
 1   body_type             15915 non-null  object 
 2   price                 15915 non-null  int64  
 3   vat                   15915 non-null  object 
 4   km                    15915 non-null  float64
 5   hp                    15915 non-null  float64
 6   type                  15915 non-null  object 
 7   previous_owners       15915 non-null  float64
 8   inspection_new        15915 non-null  object 
 9   warranty              15915 non-null  float64
 10  body_color            15915 non-null  object 
 11  paint_type            15915 non-null  object 
 12  nr_of_doors           15915 non-null  float64
 13  nr_of_seats           15915 non-null  float64
 14  gearing_type          15915 non-null  object 
 15  displacement       

In [144]:
# Single-valued columns to one-hot encode. 'gears' is in the list, so it is
# encoded as a category rather than kept as a number.
# NOTE(review): 'inspection_new' is not listed, so it stays a 'Yes'/'No' object
# column in the encoded frame — confirm that is intended.
object_columns = [
    'make_model',
    'body_type',
    'vat',
    'type',
    'body_color',
    'paint_type',
    'gearing_type',
    'gears',
    'drive_chain',
    'fuel',
    'emission_class',
]

# drop_first=True omits the first level of every encoded column;
# dtype=int stores the indicators as 0/1 integers.
df_dummied = pd.get_dummies(
    data=df,
    columns=object_columns,
    drop_first=True,
    dtype=int,
)

In [145]:
# List the column labels produced by the encoding step.
df_dummied.columns

Index(['price', 'km', 'hp', 'previous_owners', 'inspection_new', 'warranty',
       'nr_of_doors', 'nr_of_seats', 'displacement', 'cylinders', 'weight',
       'co2_emission', 'comfort_convenience', 'entertainment_media', 'extras',
       'safety_security', 'age', 'upholstery_material', 'consumption_combined',
       'consumption_city', 'consumption_country', 'make_model_Audi A2',
       'make_model_Audi A3', 'make_model_Opel Astra', 'make_model_Opel Corsa',
       'make_model_Opel Insignia', 'make_model_Renault Clio',
       'make_model_Renault Duster', 'make_model_Renault Espace',
       'body_type_Convertible', 'body_type_Coupe', 'body_type_Off-Road',
       'body_type_Other', 'body_type_Sedans', 'body_type_Station wagon',
       'body_type_Transporter', 'body_type_Van', 'vat_VAT deductible',
       'vat_VAT undeductible', 'type_Employee's car', 'type_New',
       'type_Pre-registered', 'type_Used', 'body_color_Black',
       'body_color_Blue', 'body_color_Bronze', 'body_color_Brown

In [146]:
# Spot-check one of the generated indicator columns.
df_dummied["make_model_Audi A3"]

0        0
1        0
2        0
3        0
4        0
        ..
15910    0
15911    0
15912    0
15913    0
15914    0
Name: make_model_Audi A3, Length: 15915, dtype: int64

## Apply get_dummies to the multi-label columns: extras, comfort_convenience, entertainment_media, safety_security

In [147]:
# Preview only (the result is not stored): strip any square brackets from the
# 'extras' strings, then split on ', ' into one 0/1 indicator column per item.
(
    df['extras']
    .astype('str')
    .str.replace('[', '')
    .str.replace("]", '')
    .str.get_dummies(sep=', ')
)

Unnamed: 0,'Alloy wheels','Cab or rented Car','Catalytic Converter','Handicapped enabled','Right hand drive','Roof rack','Shift paddles','Ski bag','Sliding door','Sport package','Sport seats','Sport suspension','Touch screen','Trailer hitch','Tuned car','Voice Control','Winter tyres'
0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0
1,1,0,0,0,0,0,0,0,0,0,1,1,0,0,0,1,0
2,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0
3,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0
4,1,0,0,0,0,0,0,0,0,1,0,1,0,0,0,1,0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
15910,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0
15911,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0
15912,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
15913,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0


In [148]:
def fill(method, df, column, group_cols=None):
    """
    Fill NaN values in ``df[column]`` with a mean, median or mode.

    With ``group_cols=None`` the statistic is computed over the whole column.
    Otherwise it is computed per group and every row receives the value of its
    own group. Diagnostics (NaN counts before/after and the final value
    distribution) are printed.

    Parameters
    ----------
    method : {'mean', 'median', 'mode'}
        Statistic used as the fill value.
    df : pandas.DataFrame
        Input frame. It is copied; the caller's frame is never modified.
    column : label
        Column whose missing values are filled.
    group_cols : label or list of labels, optional
        Column(s) to group by before computing the statistic.

    Returns
    -------
    pandas.DataFrame
        A copy of ``df`` with ``column`` filled where a fill value exists.
        Rows whose statistic is itself undefined (e.g. a group that contains
        only NaN) stay NaN.

    Raises
    ------
    ValueError
        If ``method`` is not one of the supported statistics.
    """
    supported = ('mean', 'median', 'mode')
    if method not in supported:
        # Previously an unknown method fell through both branches and the
        # function reported "0 NaN filled" without any hint of the mistake.
        raise ValueError(
            "method must be one of %s, got %r" % (supported, method)
        )

    def first_mode(values):
        # Series.mode() is empty when every value is NaN; fall back to NaN
        # instead of raising IndexError.
        modes = values.mode()
        return modes.iloc[0] if not modes.empty else np.nan

    # Work on a copy so the caller's frame is left untouched.
    working_df = df.copy()

    # Debug prints: which column is being filled, and grouping info.
    print('Filling column:', column)
    print('Grouping by:', group_cols)

    # 1. Count NaNs before filling
    nan_before = working_df[column].isnull().sum()

    # 2. Work out the fill value(s): a scalar without grouping, or a Series
    #    aligned to the frame's index with grouping.
    if group_cols is None:
        if method == 'mode':
            fill_values = first_mode(working_df[column])
        else:
            fill_values = getattr(working_df[column], method)()
    else:
        grouped = working_df.groupby(group_cols)[column]
        if method == 'mode':
            fill_values = grouped.transform(first_mode)
        else:
            fill_values = grouped.transform(method)

    # Assign the result back rather than calling fillna(inplace=True) on
    # working_df[column]: the in-place form acts on a temporary object and does
    # not update the frame when pandas Copy-on-Write is active.
    working_df[column] = working_df[column].fillna(fill_values)

    # 3. Count NaNs after filling
    nan_after = working_df[column].isnull().sum()
    nan_filled = nan_before - nan_after

    # 4. Print final stats
    print("Number of NaN before filling:", nan_before)
    print("Number of NaN filled:", nan_filled)
    print("Number of NaN after filling:", nan_after)
    print("------------------")
    print(working_df[column].value_counts(dropna=False))

    return working_df

In [149]:
# Re-inspect `df`. The encoding above wrote its result to `df_dummied`, and no
# cell since the load has reassigned `df`.
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 15915 entries, 0 to 15914
Data columns (total 32 columns):
 #   Column                Non-Null Count  Dtype  
---  ------                --------------  -----  
 0   make_model            15915 non-null  object 
 1   body_type             15915 non-null  object 
 2   price                 15915 non-null  int64  
 3   vat                   15915 non-null  object 
 4   km                    15915 non-null  float64
 5   hp                    15915 non-null  float64
 6   type                  15915 non-null  object 
 7   previous_owners       15915 non-null  float64
 8   inspection_new        15915 non-null  object 
 9   warranty              15915 non-null  float64
 10  body_color            15915 non-null  object 
 11  paint_type            15915 non-null  object 
 12  nr_of_doors           15915 non-null  float64
 13  nr_of_seats           15915 non-null  float64
 14  gearing_type          15915 non-null  object 
 15  displacement       

In [150]:
# One 0/1 indicator column per item found in the 'extras' strings:
# strip any square brackets, then split on ', '.
df_extras = (
    df['extras']
    .astype('str')
    .str.replace('[', '')
    .str.replace("]", '')
    .str.get_dummies(sep=', ')
)

In [151]:
# Column sums of the 0/1 indicators, i.e. how many rows carry each extra.
df_extras.sum()

'Alloy wheels'           14050
'Cab or rented Car'        310
'Catalytic Converter'     2262
'Handicapped enabled'       52
'Right hand drive'           3
'Roof rack'               2956
'Shift paddles'            508
'Ski bag'                  251
'Sliding door'               3
'Sport package'           1201
'Sport seats'             3104
'Sport suspension'        1622
'Touch screen'            4052
'Trailer hitch'            658
'Tuned car'                 13
'Voice Control'           4338
'Winter tyres'             246
dtype: int64

In [152]:
# One 0/1 indicator column per item found in the 'comfort_convenience' strings:
# strip any square brackets, then split on ', '.
df_comfort = (
    df['comfort_convenience']
    .astype('str')
    .str.replace('[', '')
    .str.replace("]", '')
    .str.get_dummies(sep=', ')
)

In [153]:
# Look at one raw value (row label 1) to see the string format that gets split below.
df['entertainment_media'][1]

"'Bluetooth', 'Hands-free equipment', 'On-board computer', 'Radio', 'Sound system'"

In [154]:
# One 0/1 indicator column per item found in the 'entertainment_media' strings:
# strip any square brackets, then split on ', '.
df_entertainment = (
    df['entertainment_media']
    .astype('str')
    .str.replace('[', '')
    .str.replace("]", '')
    .str.get_dummies(sep=', ')
)

In [155]:
# Remove the indicator column labelled 'nan' (presumably produced when missing
# values were stringified by astype('str') — TODO confirm).
df_entertainment = df_entertainment.drop(columns=['nan'])

In [156]:
# Display the entertainment indicators after the 'nan' column was removed.
df_entertainment

Unnamed: 0,'Bluetooth','CD player','Digital radio','Hands-free equipment','MP3','On-board computer','Radio','Sound system','Television','USB'
0,1,0,0,1,0,1,1,0,0,0
1,1,0,0,1,0,1,1,1,0,0
2,0,0,0,0,1,1,0,0,0,0
3,1,1,0,1,1,1,1,1,0,1
4,1,1,0,1,1,1,1,0,0,1
...,...,...,...,...,...,...,...,...,...,...
15910,1,0,1,1,0,1,1,0,0,1
15911,1,0,1,1,0,0,1,0,0,1
15912,1,0,0,1,0,1,1,0,0,0
15913,1,0,1,0,0,0,1,0,0,1


In [157]:
# One 0/1 indicator column per item found in the 'safety_security' strings:
# strip any square brackets, then split on ', '.
df_safety = (
    df['safety_security']
    .astype('str')
    .str.replace('[', '')
    .str.replace("]", '')
    .str.get_dummies(sep=', ')
)

## Drop sparse dummy columns (those with very few 1's)

In [158]:
# Per-extra counts again, used here to pick which rarely-set columns to drop.
df_extras.sum()

'Alloy wheels'           14050
'Cab or rented Car'        310
'Catalytic Converter'     2262
'Handicapped enabled'       52
'Right hand drive'           3
'Roof rack'               2956
'Shift paddles'            508
'Ski bag'                  251
'Sliding door'               3
'Sport package'           1201
'Sport seats'             3104
'Sport suspension'        1622
'Touch screen'            4052
'Trailer hitch'            658
'Tuned car'                 13
'Voice Control'           4338
'Winter tyres'             246
dtype: int64

In [159]:
# Normalise labels to snake_case: remove the quote characters, lower-case,
# and turn spaces into underscores.
df_extras.columns = [
    col.replace("'", "").lower().replace(" ", "_")
    for col in df_extras.columns
]

In [160]:
# Remove the selected extras indicators (referenced by their snake_case labels).
df_extras = df_extras.drop(
    columns=["right_hand_drive", "sliding_door", "tuned_car", "handicapped_enabled"]
)

In [161]:
# Normalise labels to snake_case: remove the quote characters, lower-case,
# and turn spaces into underscores.
df_comfort.columns = [
    col.replace("'", "").lower().replace(" ", "_")
    for col in df_comfort.columns
]

In [162]:
# Per-feature counts of the comfort indicators, most common first.
df_comfort.sum().sort_values(ascending=False)

air_conditioning                       15099
power_windows                          14756
electrical_side_mirrors                12374
multi-function_steering_wheel          11778
cruise_control                         11695
park_distance_control                  10689
parking_assist_system_sensors_rear     10049
leather_steering_wheel                  9771
start-stop_system                       9422
automatic_climate_control               9270
rain_sensor                             9096
navigation_system                       8574
light_sensor                            7995
armrest                                 7691
seat_heating                            7454
hill_holder                             7227
parking_assist_system_sensors_front     6121
parking_assist_system_camera            3587
lumbar_support                          3439
heated_steering_wheel                   3170
keyless_central_door_lock               2755
split_rear_seats                        2393
electrical

In [163]:
# Remove the selected comfort indicators (referenced by their snake_case labels).
df_comfort = df_comfort.drop(
    columns=["electric_starter", "windshield", "wind_deflector", "air_suspension"]
)

In [164]:
# These two frames were not renamed to snake_case, so their labels still
# contain the literal quote characters.
df_entertainment = df_entertainment.drop(columns=["'Television'"])
df_safety = df_safety.drop(columns=["'Night view assist'"])

## Set the leather_seats column using the upholstery_material column

In [165]:
# Row labels whose upholstery_material is one of the values counted as leather.
# NOTE(review): 'Velour' and 'alcantara' are included alongside the two leather
# values — confirm that is intended.
leather_like = ['Part leather', 'Full leather', 'alcantara', 'Velour']
is_leather_like = df_dummied['upholstery_material'].isin(leather_like)
index_leather = df_dummied.index[is_leather_like]

In [166]:
# Set leather_seats to 1 for the rows selected in index_leather; all other rows
# keep whatever value they already had.
df_comfort.loc[index_leather, 'leather_seats'] = 1

In [167]:
# upholstery_material is a text column that was not one-hot encoded; remove it
# now that index_leather has been derived from it.
df_dummied = df_dummied.drop(columns=['upholstery_material'])

In [168]:
# Remove the raw multi-label text columns; their content lives in the separate
# indicator frames (df_comfort, df_safety, df_entertainment, df_extras).
multilabel_sources = ['comfort_convenience', 'safety_security', 'entertainment_media', 'extras']
df_dummied = df_dummied.drop(columns=multilabel_sources)

In [169]:
# Remove the 'drive_chain_rear' indicator from the encoded frame.
df_dummied = df_dummied.drop(columns=['drive_chain_rear'])

## Concat all dummy dataframes

In [170]:
# Join the encoded base frame and the four indicator frames side by side
# (aligned on the row index).
# NOTE(review): df_entertainment and df_safety labels still include quote
# characters, unlike df_extras/df_comfort — confirm whether they should be
# normalised as well.
dummy_frames = [df_dummied, df_extras, df_comfort, df_entertainment, df_safety]
df_final = pd.concat(dummy_frames, axis="columns")

In [171]:
# Summarise the combined frame: size, dtype counts and memory usage.
df_final.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 15915 entries, 0 to 15914
Columns: 149 entries, price to 'Xenon headlights'
dtypes: float64(14), int64(134), object(1)
memory usage: 18.1+ MB


In [172]:
# Display the encoded base frame after the column drops above.
df_dummied

Unnamed: 0,price,km,hp,previous_owners,inspection_new,warranty,nr_of_doors,nr_of_seats,displacement,cylinders,weight,co2_emission,age,consumption_combined,consumption_city,consumption_country,make_model_Audi A2,make_model_Audi A3,make_model_Opel Astra,make_model_Opel Corsa,make_model_Opel Insignia,make_model_Renault Clio,make_model_Renault Duster,make_model_Renault Espace,body_type_Convertible,body_type_Coupe,body_type_Off-Road,body_type_Other,body_type_Sedans,body_type_Station wagon,body_type_Transporter,body_type_Van,vat_VAT deductible,vat_VAT undeductible,type_Employee's car,type_New,type_Pre-registered,type_Used,body_color_Black,body_color_Blue,body_color_Bronze,body_color_Brown,body_color_Green,body_color_Grey,body_color_Orange,body_color_Red,body_color_Silver,body_color_Violet,body_color_White,body_color_Yellow,paint_type_Perl effect,paint_type_Uni/basic,gearing_type_Manual,gearing_type_Semi-automatic,gears_6.0,gears_7.0,gears_8.0,gears_9.0,gears_50.0,drive_chain_front,fuel_Diesel,fuel_Electric,fuel_LPG/CNG,emission_class_Euro 5,emission_class_Euro 6
0,15770,56013.0,66.0,2.0,Yes,0.0,5.0,5.0,1422.0,3.0,1220.0,99.0,3.0,3.80,4.3,3.5,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,1,0,0,0,1
1,14500,80000.0,141.0,1.0,No,0.0,3.0,4.0,1798.0,4.0,1255.0,129.0,2.0,5.60,7.1,4.7,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,1
2,14640,83450.0,85.0,1.0,No,0.0,4.0,4.0,1598.0,4.0,1275.0,99.0,3.0,3.80,4.4,3.4,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,1,0,0,0,1
3,14500,73000.0,66.0,1.0,No,0.0,3.0,4.0,1422.0,3.0,1195.0,99.0,3.0,3.80,4.3,3.5,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,1,0,0,0,1
4,16790,16200.0,66.0,1.0,Yes,0.0,5.0,5.0,1422.0,3.0,1195.0,109.0,3.0,4.10,4.6,3.8,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,1,0,0,0,1
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
15910,39950,15.0,147.0,1.0,No,24.0,5.0,5.0,1997.0,4.0,1758.0,139.0,0.0,5.30,6.2,4.7,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,1,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,1,0,0,0,1
15911,39885,9900.0,165.0,1.0,No,0.0,5.0,5.0,1798.0,4.0,1708.0,168.0,0.0,6.65,7.0,6.3,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,1
15912,39875,15.0,146.0,1.0,Yes,0.0,5.0,7.0,1997.0,4.0,1779.0,139.0,0.0,5.30,6.2,4.7,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,1,1,0,0,0,1
15913,39700,10.0,147.0,1.0,No,0.0,5.0,7.0,1997.0,4.0,1758.0,139.0,0.0,5.30,6.2,4.7,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,1,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,1,0,0,0,1


In [173]:
# Total number of missing cells in the combined frame (sum over columns, then over that result).
df_final.isnull().sum().sum()

0

In [174]:
# Display the combined frame.
df_final

Unnamed: 0,price,km,hp,previous_owners,inspection_new,warranty,nr_of_doors,nr_of_seats,displacement,cylinders,weight,co2_emission,age,consumption_combined,consumption_city,consumption_country,make_model_Audi A2,make_model_Audi A3,make_model_Opel Astra,make_model_Opel Corsa,make_model_Opel Insignia,make_model_Renault Clio,make_model_Renault Duster,make_model_Renault Espace,body_type_Convertible,body_type_Coupe,body_type_Off-Road,body_type_Other,body_type_Sedans,body_type_Station wagon,body_type_Transporter,body_type_Van,vat_VAT deductible,vat_VAT undeductible,type_Employee's car,type_New,type_Pre-registered,type_Used,body_color_Black,body_color_Blue,body_color_Bronze,body_color_Brown,body_color_Green,body_color_Grey,body_color_Orange,body_color_Red,body_color_Silver,body_color_Violet,body_color_White,body_color_Yellow,paint_type_Perl effect,paint_type_Uni/basic,gearing_type_Manual,gearing_type_Semi-automatic,gears_6.0,gears_7.0,gears_8.0,gears_9.0,gears_50.0,drive_chain_front,fuel_Diesel,fuel_Electric,fuel_LPG/CNG,emission_class_Euro 5,emission_class_Euro 6,alloy_wheels,cab_or_rented_car,catalytic_converter,roof_rack,shift_paddles,ski_bag,sport_package,sport_seats,sport_suspension,touch_screen,trailer_hitch,voice_control,winter_tyres,air_conditioning,armrest,automatic_climate_control,auxiliary_heating,cruise_control,electric_tailgate,electrical_side_mirrors,electrically_adjustable_seats,electrically_heated_windshield,heads-up_display,heated_steering_wheel,hill_holder,keyless_central_door_lock,leather_seats,leather_steering_wheel,light_sensor,lumbar_support,massage_seats,multi-function_steering_wheel,navigation_system,panorama_roof,park_distance_control,parking_assist_system_camera,parking_assist_system_self-steering,parking_assist_system_sensors_front,parking_assist_system_sensors_rear,power_windows,rain_sensor,seat_heating,seat_ventilation,split_rear_seats,start-stop_system,sunroof,tinted_windows,'Bluetooth','CD player','Digital radio','Hands-free 
equipment','MP3','On-board computer','Radio','Sound system','USB','ABS','Adaptive Cruise Control','Adaptive headlights','Alarm system','Blind spot monitor','Central door lock with remote control','Central door lock','Daytime running lights','Driver drowsiness detection','Driver-side airbag','Electronic stability control','Emergency brake assistant','Emergency system','Fog lights','Head airbag','Immobilizer','Isofix','LED Daytime Running Lights','LED Headlights','Lane departure warning system','Passenger-side airbag','Power steering','Rear airbag','Side airbag','Tire pressure monitoring system','Traction control','Traffic sign recognition','Xenon headlights'
0,15770,56013.0,66.0,2.0,Yes,0.0,5.0,5.0,1422.0,3.0,1220.0,99.0,3.0,3.80,4.3,3.5,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,1,0,0,0,1,1,0,1,0,0,0,0,0,0,0,0,1,0,1,1,1,0,1,0,1,0,0,0,0,1,0,0,1,1,0,0,1,1,0,1,0,0,0,1,1,1,1,0,0,1,0,0,1,0,0,1,0,1,1,0,0,1,0,0,0,0,0,1,1,0,1,1,0,0,1,0,1,1,0,0,0,1,1,0,1,1,1,0,1
1,14500,80000.0,141.0,1.0,No,0.0,3.0,4.0,1798.0,4.0,1255.0,129.0,2.0,5.60,7.1,4.7,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,1,1,0,0,0,0,0,0,1,1,0,0,1,0,1,0,1,0,0,0,0,0,0,0,0,1,0,0,1,0,1,0,0,0,0,0,0,0,0,1,1,0,0,0,0,1,0,1,1,0,0,1,0,1,1,1,0,1,0,0,0,0,1,1,1,0,1,1,0,0,0,1,1,1,0,0,0,1,1,0,1,1,1,0,1
2,14640,83450.0,85.0,1.0,No,0.0,4.0,4.0,1598.0,4.0,1275.0,99.0,3.0,3.80,4.4,3.4,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,1,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,1,0,1,0,0,0,0,1,0,0,1,0,0,0,1,1,0,1,0,0,1,1,1,0,1,0,0,1,0,0,0,0,0,0,1,1,0,0,0,1,0,0,0,0,0,1,1,0,1,1,0,0,0,0,1,1,0,0,0,1,1,0,1,1,1,0,0
3,14500,73000.0,66.0,1.0,No,0.0,3.0,4.0,1422.0,3.0,1195.0,99.0,3.0,3.80,4.3,3.5,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,1,0,0,0,1,1,0,0,0,0,0,0,1,0,0,0,1,0,0,1,0,1,0,0,1,0,0,1,0,1,0,0,1,1,1,0,1,1,0,0,0,0,0,0,1,1,1,0,1,1,0,0,1,1,0,1,1,1,1,1,1,1,0,0,1,0,1,0,0,1,1,1,0,1,0,1,1,1,0,0,0,1,1,0,1,1,0,0,0
4,16790,16200.0,66.0,1.0,Yes,0.0,5.0,5.0,1422.0,3.0,1195.0,109.0,3.0,4.10,4.6,3.8,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,1,0,0,0,1,1,0,0,0,0,0,1,0,1,0,0,1,0,1,1,1,0,0,0,1,0,0,0,0,1,0,0,1,1,0,0,1,0,0,1,0,0,0,1,1,1,0,0,0,1,0,0,1,1,0,1,1,1,1,0,1,1,0,0,0,0,0,1,0,0,1,1,0,0,1,0,1,1,0,0,0,1,1,0,1,1,1,0,1
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
15910,39950,15.0,147.0,1.0,No,24.0,5.0,5.0,1997.0,4.0,1758.0,139.0,0.0,5.30,6.2,4.7,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,1,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,1,0,0,0,1,1,0,0,0,0,0,0,0,0,1,0,0,0,1,0,1,0,1,0,1,1,0,0,0,1,1,1,1,1,0,1,1,1,0,1,0,0,1,1,1,1,0,0,1,1,0,1,1,0,1,1,0,1,1,0,1,1,0,0,0,0,1,1,0,0,1,1,1,0,0,1,1,1,1,1,1,1,1,1,1,1,1,1,0
15911,39885,9900.0,165.0,1.0,No,0.0,5.0,5.0,1798.0,4.0,1708.0,168.0,0.0,6.65,7.0,6.3,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,1,1,0,0,0,0,0,0,0,0,1,0,1,0,1,0,1,0,1,1,1,0,1,1,1,1,1,0,1,1,1,0,0,1,0,1,1,1,1,1,1,1,1,0,0,0,1,0,1,0,1,1,0,0,1,0,1,1,1,0,0,1,0,1,1,0,1,1,1,0,0,0,1,1,1,1,1,1,1,0,1,1,1,1,0
15912,39875,15.0,146.0,1.0,Yes,0.0,5.0,7.0,1997.0,4.0,1779.0,139.0,0.0,5.30,6.2,4.7,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,1,1,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,1,1,1,0,1,1,1,0,1,1,1,0,0,1,1,1,0,1,1,1,1,1,1,0,1,1,1,1,1,1,0,0,1,0,1,0,0,1,0,1,1,0,0,1,1,0,0,1,0,1,1,0,1,1,1,0,0,0,1,1,1,1,1,1,1,0,1,0,1,1,0
15913,39700,10.0,147.0,1.0,No,0.0,5.0,7.0,1997.0,4.0,1758.0,139.0,0.0,5.30,6.2,4.7,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,1,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,1,0,0,0,1,1,0,0,0,0,0,0,0,0,1,0,0,0,1,0,1,0,1,0,1,1,0,0,0,0,0,1,1,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,1,0,0,1,0,1,0,0,0,1,0,1,1,0,0,0,1,0,0,0,0,1,1,1,0,0,0,0,1,0,1,0,1,1,0,1,1,0,1,0


In [175]:
# Persist the fully encoded frame. `df` is only the unencoded copy of the input,
# so writing it would discard every transformation done in this notebook.
df_final.to_csv('car_data_4_final_drew_gervang.csv', index = False)