# World Lab Chicago Data Cleaning

In [1]:
# Dependencies
import matplotlib
from matplotlib import pyplot as plt
from scipy import stats
import numpy as np
import pandas as pd
from scipy.stats import linregress

In [2]:
# Load the raw mailing-list export from the local data folder into a DataFrame
mailing_list_data = pd.read_csv(
    filepath_or_buffer="data/world_lab_chicago_mailing_list.csv",
)
# Bare expression as the final line so the notebook renders the frame
mailing_list_data

Unnamed: 0,Date List Produced,Record Obsolescence Date,Source,COMPANYNAME,ADDRESS,CITY,STATE,ZIPCODE,MAILING CARRIER ROUTE,MAILING DELIVERY POINT BAR CODE,...,SECONDARY SIC DESCRIPTION #1,SECONDARY SIC #2,SECONDARY SIC DESCRIPTION #2,METRO AREA,DATA AXLE USA ID,LAST NAME,FIRST NAME,CONTACT TITLE,CONTACT PROF TITLE,CONTACT GENDER
0,Sep 14 2021,Mar 14 2022,Data Axle,12 Group Inc,462 N Mclean Blvd,Elgin,IL,60123-3240,C050,621.0,...,Laboratories-Dental,,,"Chicago-Npvl, IL",728986869,,,,,
1,Sep 14 2021,Mar 14 2022,Data Axle,151st Street Dental,9017 W 151st St,Orland Park,IL,60462-3201,C015,178.0,...,Dentists,,,"Chicago-Npvl, IL",403683151,,,,,
2,Sep 14 2021,Mar 14 2022,Data Axle,176 Dental Assoc LTD,176 S Bloomingdale Rd # A,Bloomingdale,IL,60108-1404,C012,736.0,...,Dentists,,,"Chicago-Npvl, IL",402741733,Matustik,Joseph,OWNER,,Male
3,Sep 14 2021,Mar 14 2022,Data Axle,1st American Dental,2749 W Cermak Rd,Chicago,IL,60608-4682,C019,992.0,...,Dentists,,,"Chicago-Npvl, IL",748693205,Aqel,Fadi M,OPERATIONS,,Male
4,Sep 14 2021,Mar 14 2022,Data Axle,1st Dental Care,1556 Douglas Rd,Montgomery,IL,60538-1645,C002,561.0,...,Dentists,,,"Chicago-Npvl, IL",424726060,Malaki,Abdul,PRESIDENT,,Male
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
5956,Sep 14 2021,Mar 14 2022,Data Axle,Mark R Zelko DDS,2305 Silvernail Rd,Pewaukee,WI,53072-5402,R016,57.0,...,Dentists,,,"Milwaukee, WI",715687831,Zelko,Mark R,,DDS,Male
5957,Sep 14 2021,Mar 14 2022,Data Axle,Kenneth J Zganjar DDS,6051 W Brown Deer Rd # 201,Milwaukee,WI,53223-2263,C050,516.0,...,Dentists,,,"Milwaukee, WI",146289947,Zganjar,Kenneth J,,DDS,Male
5958,Sep 14 2021,Mar 14 2022,Data Axle,Henry E Zimmermann DDS,190 Gardner Ave # 7,Burlington,WI,53105-2160,C014,70.0,...,Dentists,,,"Racine, WI",437502198,Zimmermann,Henry E,,DDS,Male
5959,Sep 14 2021,Mar 14 2022,Data Axle,Ziolkowski Dental Sc,3970 N Oakland Ave # 403,Shorewood,WI,53211-2265,C043,30.0,...,Dentists,596104.0,E-Commerce,"Milwaukee, WI",261216170,Ziolkowski,Keith Alan,PRESIDENT,,Male


In [3]:
# Build a narrower frame holding only the company, address and SIC fields
selected_columns = [
    "COMPANYNAME",
    "ADDRESS",
    "CITY",
    "STATE",
    "ZIPCODE",
    "COUNTY",
    "PRIMARYSICDESCRIPTION",
]
# All rows, selected columns only; a missing column name raises KeyError
mailing_list_df = mailing_list_data.loc[:, selected_columns]
mailing_list_df

Unnamed: 0,COMPANYNAME,ADDRESS,CITY,STATE,ZIPCODE,COUNTY,PRIMARYSICDESCRIPTION
0,12 Group Inc,462 N Mclean Blvd,Elgin,IL,60123-3240,Kane,Laboratories-Dental
1,151st Street Dental,9017 W 151st St,Orland Park,IL,60462-3201,Cook,Dentists
2,176 Dental Assoc LTD,176 S Bloomingdale Rd # A,Bloomingdale,IL,60108-1404,Du Page,Dentists
3,1st American Dental,2749 W Cermak Rd,Chicago,IL,60608-4682,Cook,Dentists
4,1st Dental Care,1556 Douglas Rd,Montgomery,IL,60538-1645,Kane,Dentists
...,...,...,...,...,...,...,...
5956,Mark R Zelko DDS,2305 Silvernail Rd,Pewaukee,WI,53072-5402,Waukesha,Dentists
5957,Kenneth J Zganjar DDS,6051 W Brown Deer Rd # 201,Milwaukee,WI,53223-2263,Milwaukee,Dentists
5958,Henry E Zimmermann DDS,190 Gardner Ave # 7,Burlington,WI,53105-2160,Racine,Dentists
5959,Ziolkowski Dental Sc,3970 N Oakland Ave # 403,Shorewood,WI,53211-2265,Milwaukee,Dentists


In [4]:
# Discard every row that has a missing value in at least one of the kept columns
mailing_list_df = mailing_list_df.dropna(axis="index", how="any")
mailing_list_df

Unnamed: 0,COMPANYNAME,ADDRESS,CITY,STATE,ZIPCODE,COUNTY,PRIMARYSICDESCRIPTION
0,12 Group Inc,462 N Mclean Blvd,Elgin,IL,60123-3240,Kane,Laboratories-Dental
1,151st Street Dental,9017 W 151st St,Orland Park,IL,60462-3201,Cook,Dentists
2,176 Dental Assoc LTD,176 S Bloomingdale Rd # A,Bloomingdale,IL,60108-1404,Du Page,Dentists
3,1st American Dental,2749 W Cermak Rd,Chicago,IL,60608-4682,Cook,Dentists
4,1st Dental Care,1556 Douglas Rd,Montgomery,IL,60538-1645,Kane,Dentists
...,...,...,...,...,...,...,...
5956,Mark R Zelko DDS,2305 Silvernail Rd,Pewaukee,WI,53072-5402,Waukesha,Dentists
5957,Kenneth J Zganjar DDS,6051 W Brown Deer Rd # 201,Milwaukee,WI,53223-2263,Milwaukee,Dentists
5958,Henry E Zimmermann DDS,190 Gardner Ave # 7,Burlington,WI,53105-2160,Racine,Dentists
5959,Ziolkowski Dental Sc,3970 N Oakland Ave # 403,Shorewood,WI,53211-2265,Milwaukee,Dentists


In [5]:
# Map the raw upper-case export headers to human-readable column titles
readable_column_names = {
    "COMPANYNAME": "Company Name",
    "ADDRESS": "Address",
    "CITY": "City",
    "STATE": "State",
    "ZIPCODE": "Zip Code",
    "COUNTY": "County",
    "PRIMARYSICDESCRIPTION": "Primary SIC Description",
}
# Rename, then renumber the rows 0..n-1 (dropping rows with nulls left gaps
# in the index); drop=True discards the old index instead of keeping it as a column
mailing_list_cleaned_df = (
    mailing_list_df
    .rename(columns=readable_column_names)
    .reset_index(drop=True)
)
mailing_list_cleaned_df

Unnamed: 0,Company Name,Address,City,State,Zip Code,County,Primary SIC Description
0,12 Group Inc,462 N Mclean Blvd,Elgin,IL,60123-3240,Kane,Laboratories-Dental
1,151st Street Dental,9017 W 151st St,Orland Park,IL,60462-3201,Cook,Dentists
2,176 Dental Assoc LTD,176 S Bloomingdale Rd # A,Bloomingdale,IL,60108-1404,Du Page,Dentists
3,1st American Dental,2749 W Cermak Rd,Chicago,IL,60608-4682,Cook,Dentists
4,1st Dental Care,1556 Douglas Rd,Montgomery,IL,60538-1645,Kane,Dentists
...,...,...,...,...,...,...,...
5955,Mark R Zelko DDS,2305 Silvernail Rd,Pewaukee,WI,53072-5402,Waukesha,Dentists
5956,Kenneth J Zganjar DDS,6051 W Brown Deer Rd # 201,Milwaukee,WI,53223-2263,Milwaukee,Dentists
5957,Henry E Zimmermann DDS,190 Gardner Ave # 7,Burlington,WI,53105-2160,Racine,Dentists
5958,Ziolkowski Dental Sc,3970 N Oakland Ave # 403,Shorewood,WI,53211-2265,Milwaukee,Dentists


In [6]:
# Export the cleaned mailing list to a CSV file in the data folder.
# index=False omits the row index: it was reset to a plain 0..n-1 range and
# carries no information, and writing it would add an unnamed leading column
# that comes back as "Unnamed: 0" when the file is re-read with pd.read_csv.
mailing_list_cleaned_df.to_csv(
    r'data/world_lab_chicago_mailing_list_cleaned.csv',
    index=False,
)