## Practice with Jupyter Notebook

I'm reworking assignment 2 to practice committing to GitHub from a local file.

In [1]:
import pandas as pd
import numpy as np

In [6]:
# # fetch data with bash command
# !curl https://archive.ics.uci.edu/ml/machine-learning-databases/auto-mpg/auto-mpg.data-original

# # save data file locally
# !wget https://archive.ics.uci.edu/ml/machine-learning-databases/auto-mpg/auto-mpg.data-original

# NOTE: !curl worked on Windows, but !wget didn't. TODO: ask someone whether !wget can work on Windows or whether there's a different command to use instead.

In [28]:
# Load data
# This UCI Machine Learning dataset has 2 links for the same data, but both datasets have different issues
mpg_data_url_original = 'https://archive.ics.uci.edu/ml/machine-learning-databases/auto-mpg/auto-mpg.data-original'
mpg_data_url_revised = 'https://archive.ics.uci.edu/ml/machine-learning-databases/auto-mpg/auto-mpg.data'

# Both files are read with header=None, so the column names are supplied here,
# once, and shared by both reads to keep the two frames' schemas in sync.
mpg_column_names = ['mpg', 'cylinders', 'displacement', 'horsepower', 'weight',
                    'acceleration', 'model year', 'origin', 'car name']

# The separator is a regex (one or more whitespace characters). It is written as a
# raw string because '\s' in a plain string literal is an invalid escape sequence
# that newer Python versions warn about.
df_original = pd.read_csv(mpg_data_url_original, header=None, sep=r'\s+', names=mpg_column_names)
df_revised = pd.read_csv(mpg_data_url_revised, header=None, sep=r'\s+', names=mpg_column_names)

# Preview the first rows of each frame for a side-by-side comparison
print('Original Dataset: \n', df_original.head())
print('\n\nRevised Dataset: \n', df_revised.head())

Original Dataset: 
     mpg  cylinders  displacement  horsepower  weight  acceleration  \
0  18.0        8.0         307.0       130.0  3504.0          12.0   
1  15.0        8.0         350.0       165.0  3693.0          11.5   
2  18.0        8.0         318.0       150.0  3436.0          11.0   
3  16.0        8.0         304.0       150.0  3433.0          12.0   
4  17.0        8.0         302.0       140.0  3449.0          10.5   

   model year  origin                   car name  
0        70.0     1.0  chevrolet chevelle malibu  
1        70.0     1.0          buick skylark 320  
2        70.0     1.0         plymouth satellite  
3        70.0     1.0              amc rebel sst  
4        70.0     1.0                ford torino  


Revised Dataset: 
     mpg  cylinders  displacement horsepower  weight  acceleration  model year  \
0  18.0          8         307.0      130.0  3504.0          12.0          70   
1  15.0          8         350.0      165.0  3693.0          11.5     

In [29]:
# Original dataset: report the per-column count of missing values, then the column dtypes
for original_report in (df_original.isna().sum(), df_original.dtypes):
    print(original_report)

mpg             8
cylinders       0
displacement    0
horsepower      6
weight          0
acceleration    0
model year      0
origin          0
car name        0
dtype: int64
mpg             float64
cylinders       float64
displacement    float64
horsepower      float64
weight          float64
acceleration    float64
model year      float64
origin          float64
car name         object
dtype: object


In the original dataset, the mpg and horsepower columns have missing data, but all of the data types are correct.

In [30]:
# Revised dataset: report the per-column count of missing values, then the column dtypes
for revised_report in (df_revised.isna().sum(), df_revised.dtypes):
    print(revised_report)

mpg             0
cylinders       0
displacement    0
horsepower      0
weight          0
acceleration    0
model year      0
origin          0
car name        0
dtype: int64
mpg             float64
cylinders         int64
displacement    float64
horsepower       object
weight          float64
acceleration    float64
model year        int64
origin            int64
car name         object
dtype: object


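In the revised dataset, `isnull()` doesn't report any missing data (but we know it's there), and the horsepower column shows type object instead of float. Both symptoms would be explained by the missing values being stored as a placeholder string (such as '?') rather than as NaN.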

In [31]:
# Convert '?' values to NaN so that isnull() counts them as missing.
# np.nan is used rather than the np.NaN alias, which was removed in NumPy 2.0.
df_original_nan = df_original.replace('?', np.nan)
df_revised_nan = df_revised.replace('?', np.nan)

# Re-count missing values per column after the replacement
print('Original Data: \n', df_original_nan.isnull().sum())
print('Revised Data: \n', df_revised_nan.isnull().sum())

Original Data: 
 mpg             8
cylinders       0
displacement    0
horsepower      6
weight          0
acceleration    0
model year      0
origin          0
car name        0
dtype: int64
Revised Data: 
 mpg             0
cylinders       0
displacement    0
horsepower      6
weight          0
acceleration    0
model year      0
origin          0
car name        0
dtype: int64


In [32]:
# Fill forward to replace NaN values: each NaN takes the last valid value above it
# in the same column. DataFrame.ffill() is the direct equivalent of
# fillna(method='ffill'), whose `method` argument is deprecated in recent pandas.
df_original_no_nan = df_original_nan.ffill()
df_revised_no_nan = df_revised_nan.ffill()

# Confirm that no missing values remain in either frame
print('Original Data: \n', df_original_no_nan.isnull().sum())
print('Revised Data: \n', df_revised_no_nan.isnull().sum())

Original Data: 
 mpg             0
cylinders       0
displacement    0
horsepower      0
weight          0
acceleration    0
model year      0
origin          0
car name        0
dtype: int64
Revised Data: 
 mpg             0
cylinders       0
displacement    0
horsepower      0
weight          0
acceleration    0
model year      0
origin          0
car name        0
dtype: int64


In [33]:
# Cast the revised dataset's horsepower column from object to float,
# rebinding the same name so later cells see the converted frame
df_revised_no_nan = df_revised_no_nan.assign(
    horsepower=df_revised_no_nan['horsepower'].astype(float)
)
# Display the dtypes to verify the conversion
df_revised_no_nan.dtypes

mpg             float64
cylinders         int64
displacement    float64
horsepower      float64
weight          float64
acceleration    float64
model year        int64
origin            int64
car name         object
dtype: object

In [34]:
# One-hot encode the categorical 'car name' column in both datasets:
# each distinct name becomes its own indicator column
df_original_cleaned, df_revised_cleaned = (
    pd.get_dummies(frame, columns=['car name'])
    for frame in (df_original_no_nan, df_revised_no_nan)
)

In [35]:
# Widen pandas' display limits so every column of the encoded frames is shown
display_settings = {
    'display.max_columns': 500,
    'display.width': 1000,
}
for setting_name, setting_value in display_settings.items():
    pd.set_option(setting_name, setting_value)

# Show the first rows of the cleaned original dataset
df_original_cleaned.head()

Unnamed: 0,mpg,cylinders,displacement,horsepower,weight,acceleration,model year,origin,car name_amc ambassador brougham,car name_amc ambassador dpl,car name_amc ambassador sst,car name_amc concord,car name_amc concord d/l,car name_amc concord dl,car name_amc concord dl 6,car name_amc gremlin,car name_amc hornet,car name_amc hornet sportabout (sw),car name_amc matador,car name_amc matador (sw),car name_amc pacer,car name_amc pacer d/l,car name_amc rebel sst,car name_amc rebel sst (sw),car name_amc spirit dl,car name_audi 100 ls,car name_audi 100ls,car name_audi 4000,car name_audi 5000,car name_audi 5000s (diesel),car name_audi fox,car name_bmw 2002,car name_bmw 320i,car name_buick century,car name_buick century 350,car name_buick century limited,car name_buick century luxus (sw),car name_buick century special,car name_buick electra 225 custom,car name_buick estate wagon (sw),car name_buick lesabre custom,car name_buick opel isuzu deluxe,car name_buick regal sport coupe (turbo),car name_buick skyhawk,car name_buick skylark,car name_buick skylark 320,car name_buick skylark limited,car name_cadillac eldorado,car name_cadillac seville,car name_capri ii,car name_chevroelt chevelle malibu,car name_chevrolet bel air,car name_chevrolet camaro,car name_chevrolet caprice classic,car name_chevrolet cavalier,car name_chevrolet cavalier 2-door,car name_chevrolet cavalier wagon,car name_chevrolet chevelle concours (sw),car name_chevrolet chevelle malibu,car name_chevrolet chevelle malibu classic,car name_chevrolet chevette,car name_chevrolet citation,car name_chevrolet concours,car name_chevrolet impala,car name_chevrolet malibu,car name_chevrolet malibu classic (sw),car name_chevrolet monte carlo,car name_chevrolet monte carlo landau,car name_chevrolet monte carlo s,car name_chevrolet monza 2+2,car name_chevrolet nova,car name_chevrolet nova custom,car name_chevrolet vega,car name_chevrolet vega (sw),car name_chevrolet vega 2300,car name_chevrolet woody,car name_chevy c10,car 
name_chevy c20,car name_chevy s-10,car name_chrysler cordoba,car name_chrysler lebaron medallion,car name_chrysler lebaron salon,car name_chrysler lebaron town @ country (sw),car name_chrysler new yorker brougham,car name_chrysler newport royal,car name_citroen ds-21 pallas,car name_datsun 1200,car name_datsun 200-sx,car name_datsun 200sx,car name_datsun 210,car name_datsun 210 mpg,car name_datsun 280-zx,car name_datsun 310,car name_datsun 310 gx,car name_datsun 510,car name_datsun 510 (sw),car name_datsun 510 hatchback,car name_datsun 610,car name_datsun 710,car name_datsun 810,car name_datsun 810 maxima,car name_datsun b-210,car name_datsun b210,car name_datsun b210 gx,car name_datsun f-10 hatchback,car name_datsun pl510,car name_dodge aries se,car name_dodge aries wagon (sw),car name_dodge aspen,car name_dodge aspen 6,car name_dodge aspen se,car name_dodge challenger se,car name_dodge charger 2.2,car name_dodge colt,car name_dodge colt (sw),car name_dodge colt hardtop,car name_dodge colt hatchback custom,car name_dodge colt m/m,car name_dodge coronet brougham,car name_dodge coronet custom,car name_dodge coronet custom (sw),car name_dodge d100,car name_dodge d200,car name_dodge dart custom,car name_dodge diplomat,car name_dodge magnum xe,car name_dodge monaco (sw),car name_dodge monaco brougham,car name_dodge omni,car name_dodge rampage,car name_dodge st. 
regis,car name_fiat 124 sport coupe,car name_fiat 124 tc,car name_fiat 124b,car name_fiat 128,car name_fiat 131,car name_fiat strada custom,car name_fiat x1.9,car name_ford country,car name_ford country squire (sw),car name_ford escort 2h,car name_ford escort 4w,car name_ford f108,car name_ford f250,car name_ford fairmont,car name_ford fairmont (auto),car name_ford fairmont (man),car name_ford fairmont 4,car name_ford fairmont futura,car name_ford fiesta,car name_ford futura,car name_ford galaxie 500,car name_ford gran torino,car name_ford gran torino (sw),car name_ford granada,car name_ford granada ghia,car name_ford granada gl,car name_ford granada l,car name_ford ltd,car name_ford ltd landau,car name_ford maverick,car name_ford mustang,car name_ford mustang boss 302,car name_ford mustang cobra,car name_ford mustang gl,car name_ford mustang ii,car name_ford mustang ii 2+2,car name_ford pinto,car name_ford pinto (sw),car name_ford pinto runabout,car name_ford ranger,car name_ford thunderbird,car name_ford torino,car name_ford torino (sw),car name_ford torino 500,car name_hi 1200d,car name_honda accord,car name_honda accord cvcc,car name_honda accord lx,car name_honda civic,car name_honda civic (auto),car name_honda civic 1300,car name_honda civic 1500 gl,car name_honda civic cvcc,car name_honda prelude,car name_maxda glc deluxe,car name_maxda rx3,car name_mazda 626,car name_mazda glc,car name_mazda glc 4,car name_mazda glc custom,car name_mazda glc custom l,car name_mazda glc deluxe,car name_mazda rx-4,car name_mazda rx-7 gs,car name_mazda rx2 coupe,car name_mercedes benz 300d,car name_mercedes-benz 240d,car name_mercedes-benz 280s,car name_mercury capri 2000,car name_mercury capri v6,car name_mercury cougar brougham,car name_mercury grand marquis,car name_mercury lynx l,car name_mercury marquis,car name_mercury marquis brougham,car name_mercury monarch,car name_mercury monarch ghia,car name_mercury zephyr,car name_mercury zephyr 6,car name_nissan stanza xe,car 
name_oldsmobile cutlass ciera (diesel),car name_oldsmobile cutlass ls,car name_oldsmobile cutlass salon brougham,car name_oldsmobile cutlass supreme,car name_oldsmobile delta 88 royale,car name_oldsmobile omega,car name_oldsmobile omega brougham,car name_oldsmobile starfire sx,car name_oldsmobile vista cruiser,car name_opel 1900,car name_opel manta,car name_peugeot 304,car name_peugeot 504,car name_peugeot 504 (sw),car name_peugeot 505s turbo diesel,car name_peugeot 604sl,car name_plymouth 'cuda 340,car name_plymouth arrow gs,car name_plymouth champ,car name_plymouth cricket,car name_plymouth custom suburb,car name_plymouth duster,car name_plymouth fury,car name_plymouth fury gran sedan,car name_plymouth fury iii,car name_plymouth grand fury,car name_plymouth horizon,car name_plymouth horizon 4,car name_plymouth horizon miser,car name_plymouth horizon tc3,car name_plymouth reliant,car name_plymouth sapporo,car name_plymouth satellite,car name_plymouth satellite (sw),car name_plymouth satellite custom,car name_plymouth satellite custom (sw),car name_plymouth satellite sebring,car name_plymouth valiant,car name_plymouth valiant custom,car name_plymouth volare,car name_plymouth volare custom,car name_plymouth volare premier v8,car name_pontiac astro,car name_pontiac catalina,car name_pontiac catalina brougham,car name_pontiac firebird,car name_pontiac grand prix,car name_pontiac grand prix lj,car name_pontiac j2000 se hatchback,car name_pontiac lemans v6,car name_pontiac phoenix,car name_pontiac phoenix lj,car name_pontiac safari (sw),car name_pontiac sunbird coupe,car name_pontiac ventura sj,car name_renault 12 (sw),car name_renault 12tl,car name_renault 18i,car name_renault 5 gtl,car name_renault lecar deluxe,car name_saab 900s,car name_saab 99e,car name_saab 99gle,car name_saab 99le,car name_subaru,car name_subaru dl,car name_toyota carina,car name_toyota celica gt,car name_toyota celica gt liftback,car name_toyota corolla,car name_toyota corolla 1200,car 
name_toyota corolla 1600 (sw),car name_toyota corolla liftback,car name_toyota corolla tercel,car name_toyota corona,car name_toyota corona hardtop,car name_toyota corona liftback,car name_toyota corona mark ii,car name_toyota cressida,car name_toyota mark ii,car name_toyota starlet,car name_toyota tercel,car name_toyouta corona mark ii (sw),car name_triumph tr7 coupe,car name_vokswagen rabbit,car name_volkswagen 1131 deluxe sedan,car name_volkswagen 411 (sw),car name_volkswagen dasher,car name_volkswagen jetta,car name_volkswagen model 111,car name_volkswagen rabbit,car name_volkswagen rabbit custom,car name_volkswagen rabbit custom diesel,car name_volkswagen rabbit l,car name_volkswagen scirocco,car name_volkswagen super beetle,car name_volkswagen super beetle 117,car name_volkswagen type 3,car name_volvo 144ea,car name_volvo 145e (sw),car name_volvo 244dl,car name_volvo 245,car name_volvo 264gl,car name_volvo diesel,car name_vw dasher (diesel),car name_vw pickup,car name_vw rabbit,car name_vw rabbit c (diesel),car name_vw rabbit custom
0,18.0,8.0,307.0,130.0,3504.0,12.0,70.0,1.0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
1,15.0,8.0,350.0,165.0,3693.0,11.5,70.0,1.0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
2,18.0,8.0,318.0,150.0,3436.0,11.0,70.0,1.0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
3,16.0,8.0,304.0,150.0,3433.0,12.0,70.0,1.0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
4,17.0,8.0,302.0,140.0,3449.0,10.5,70.0,1.0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0


In [36]:
# Show the first five rows of the cleaned revised dataset
df_revised_cleaned.head(n=5)

Unnamed: 0,mpg,cylinders,displacement,horsepower,weight,acceleration,model year,origin,car name_amc ambassador brougham,car name_amc ambassador dpl,car name_amc ambassador sst,car name_amc concord,car name_amc concord d/l,car name_amc concord dl,car name_amc concord dl 6,car name_amc gremlin,car name_amc hornet,car name_amc hornet sportabout (sw),car name_amc matador,car name_amc matador (sw),car name_amc pacer,car name_amc pacer d/l,car name_amc rebel sst,car name_amc spirit dl,car name_audi 100 ls,car name_audi 100ls,car name_audi 4000,car name_audi 5000,car name_audi 5000s (diesel),car name_audi fox,car name_bmw 2002,car name_bmw 320i,car name_buick century,car name_buick century 350,car name_buick century limited,car name_buick century luxus (sw),car name_buick century special,car name_buick electra 225 custom,car name_buick estate wagon (sw),car name_buick lesabre custom,car name_buick opel isuzu deluxe,car name_buick regal sport coupe (turbo),car name_buick skyhawk,car name_buick skylark,car name_buick skylark 320,car name_buick skylark limited,car name_cadillac eldorado,car name_cadillac seville,car name_capri ii,car name_chevroelt chevelle malibu,car name_chevrolet bel air,car name_chevrolet camaro,car name_chevrolet caprice classic,car name_chevrolet cavalier,car name_chevrolet cavalier 2-door,car name_chevrolet cavalier wagon,car name_chevrolet chevelle concours (sw),car name_chevrolet chevelle malibu,car name_chevrolet chevelle malibu classic,car name_chevrolet chevette,car name_chevrolet citation,car name_chevrolet concours,car name_chevrolet impala,car name_chevrolet malibu,car name_chevrolet malibu classic (sw),car name_chevrolet monte carlo,car name_chevrolet monte carlo landau,car name_chevrolet monte carlo s,car name_chevrolet monza 2+2,car name_chevrolet nova,car name_chevrolet nova custom,car name_chevrolet vega,car name_chevrolet vega (sw),car name_chevrolet vega 2300,car name_chevrolet woody,car name_chevy c10,car name_chevy c20,car name_chevy 
s-10,car name_chrysler cordoba,car name_chrysler lebaron medallion,car name_chrysler lebaron salon,car name_chrysler lebaron town @ country (sw),car name_chrysler new yorker brougham,car name_chrysler newport royal,car name_datsun 1200,car name_datsun 200-sx,car name_datsun 200sx,car name_datsun 210,car name_datsun 210 mpg,car name_datsun 280-zx,car name_datsun 310,car name_datsun 310 gx,car name_datsun 510,car name_datsun 510 (sw),car name_datsun 510 hatchback,car name_datsun 610,car name_datsun 710,car name_datsun 810,car name_datsun 810 maxima,car name_datsun b-210,car name_datsun b210,car name_datsun b210 gx,car name_datsun f-10 hatchback,car name_datsun pl510,car name_dodge aries se,car name_dodge aries wagon (sw),car name_dodge aspen,car name_dodge aspen 6,car name_dodge aspen se,car name_dodge challenger se,car name_dodge charger 2.2,car name_dodge colt,car name_dodge colt (sw),car name_dodge colt hardtop,car name_dodge colt hatchback custom,car name_dodge colt m/m,car name_dodge coronet brougham,car name_dodge coronet custom,car name_dodge coronet custom (sw),car name_dodge d100,car name_dodge d200,car name_dodge dart custom,car name_dodge diplomat,car name_dodge magnum xe,car name_dodge monaco (sw),car name_dodge monaco brougham,car name_dodge omni,car name_dodge rampage,car name_dodge st. 
regis,car name_fiat 124 sport coupe,car name_fiat 124 tc,car name_fiat 124b,car name_fiat 128,car name_fiat 131,car name_fiat strada custom,car name_fiat x1.9,car name_ford country,car name_ford country squire (sw),car name_ford escort 2h,car name_ford escort 4w,car name_ford f108,car name_ford f250,car name_ford fairmont,car name_ford fairmont (auto),car name_ford fairmont (man),car name_ford fairmont 4,car name_ford fairmont futura,car name_ford fiesta,car name_ford futura,car name_ford galaxie 500,car name_ford gran torino,car name_ford gran torino (sw),car name_ford granada,car name_ford granada ghia,car name_ford granada gl,car name_ford granada l,car name_ford ltd,car name_ford ltd landau,car name_ford maverick,car name_ford mustang,car name_ford mustang cobra,car name_ford mustang gl,car name_ford mustang ii,car name_ford mustang ii 2+2,car name_ford pinto,car name_ford pinto (sw),car name_ford pinto runabout,car name_ford ranger,car name_ford thunderbird,car name_ford torino,car name_ford torino 500,car name_hi 1200d,car name_honda accord,car name_honda accord cvcc,car name_honda accord lx,car name_honda civic,car name_honda civic (auto),car name_honda civic 1300,car name_honda civic 1500 gl,car name_honda civic cvcc,car name_honda prelude,car name_maxda glc deluxe,car name_maxda rx3,car name_mazda 626,car name_mazda glc,car name_mazda glc 4,car name_mazda glc custom,car name_mazda glc custom l,car name_mazda glc deluxe,car name_mazda rx-4,car name_mazda rx-7 gs,car name_mazda rx2 coupe,car name_mercedes benz 300d,car name_mercedes-benz 240d,car name_mercedes-benz 280s,car name_mercury capri 2000,car name_mercury capri v6,car name_mercury cougar brougham,car name_mercury grand marquis,car name_mercury lynx l,car name_mercury marquis,car name_mercury marquis brougham,car name_mercury monarch,car name_mercury monarch ghia,car name_mercury zephyr,car name_mercury zephyr 6,car name_nissan stanza xe,car name_oldsmobile cutlass ciera (diesel),car name_oldsmobile 
cutlass ls,car name_oldsmobile cutlass salon brougham,car name_oldsmobile cutlass supreme,car name_oldsmobile delta 88 royale,car name_oldsmobile omega,car name_oldsmobile omega brougham,car name_oldsmobile starfire sx,car name_oldsmobile vista cruiser,car name_opel 1900,car name_opel manta,car name_peugeot 304,car name_peugeot 504,car name_peugeot 504 (sw),car name_peugeot 505s turbo diesel,car name_peugeot 604sl,car name_plymouth 'cuda 340,car name_plymouth arrow gs,car name_plymouth champ,car name_plymouth cricket,car name_plymouth custom suburb,car name_plymouth duster,car name_plymouth fury,car name_plymouth fury gran sedan,car name_plymouth fury iii,car name_plymouth grand fury,car name_plymouth horizon,car name_plymouth horizon 4,car name_plymouth horizon miser,car name_plymouth horizon tc3,car name_plymouth reliant,car name_plymouth sapporo,car name_plymouth satellite,car name_plymouth satellite custom,car name_plymouth satellite custom (sw),car name_plymouth satellite sebring,car name_plymouth valiant,car name_plymouth valiant custom,car name_plymouth volare,car name_plymouth volare custom,car name_plymouth volare premier v8,car name_pontiac astro,car name_pontiac catalina,car name_pontiac catalina brougham,car name_pontiac firebird,car name_pontiac grand prix,car name_pontiac grand prix lj,car name_pontiac j2000 se hatchback,car name_pontiac lemans v6,car name_pontiac phoenix,car name_pontiac phoenix lj,car name_pontiac safari (sw),car name_pontiac sunbird coupe,car name_pontiac ventura sj,car name_renault 12 (sw),car name_renault 12tl,car name_renault 18i,car name_renault 5 gtl,car name_renault lecar deluxe,car name_saab 99e,car name_saab 99gle,car name_saab 99le,car name_subaru,car name_subaru dl,car name_toyota carina,car name_toyota celica gt,car name_toyota celica gt liftback,car name_toyota corolla,car name_toyota corolla 1200,car name_toyota corolla 1600 (sw),car name_toyota corolla liftback,car name_toyota corolla tercel,car name_toyota corona,car 
name_toyota corona hardtop,car name_toyota corona liftback,car name_toyota corona mark ii,car name_toyota cressida,car name_toyota mark ii,car name_toyota starlet,car name_toyota tercel,car name_toyouta corona mark ii (sw),car name_triumph tr7 coupe,car name_vokswagen rabbit,car name_volkswagen 1131 deluxe sedan,car name_volkswagen 411 (sw),car name_volkswagen dasher,car name_volkswagen jetta,car name_volkswagen model 111,car name_volkswagen rabbit,car name_volkswagen rabbit custom,car name_volkswagen rabbit custom diesel,car name_volkswagen rabbit l,car name_volkswagen scirocco,car name_volkswagen super beetle,car name_volkswagen type 3,car name_volvo 144ea,car name_volvo 145e (sw),car name_volvo 244dl,car name_volvo 245,car name_volvo 264gl,car name_volvo diesel,car name_vw dasher (diesel),car name_vw pickup,car name_vw rabbit,car name_vw rabbit c (diesel),car name_vw rabbit custom
0,18.0,8,307.0,130.0,3504.0,12.0,70,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
1,15.0,8,350.0,165.0,3693.0,11.5,70,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
2,18.0,8,318.0,150.0,3436.0,11.0,70,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
3,16.0,8,304.0,150.0,3433.0,12.0,70,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
4,17.0,8,302.0,140.0,3449.0,10.5,70,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0


In [38]:
# (rows, columns) of the revised dataset after one-hot encoding
df_revised_cleaned.shape

(398, 313)

In [39]:
# (rows, columns) of the original dataset after one-hot encoding
df_original_cleaned.shape

(406, 320)

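Not sure why there are more observations in the original dataset (406 rows vs. 398). It's possible that some bad data was removed when it was updated: the difference of 8 rows matches the 8 missing mpg values found in the original dataset, so those rows may have been dropped from the revised file.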