In [1]:
import os
import pandas as pd

PATH = os.getcwd() #Pulls your current working directory
FILE = 'Customers.csv'
FULL_PATH = os.path.join(PATH, FILE) #Joins directory and file as one string

#Import data from file
data = pd.read_csv(FULL_PATH, sep='\t', encoding='utf-8') 
data.head()

Unnamed: 0,Customer_ID,Last_Name,First_Name,Sex,Age,ZIP,Plan,Plan_Start_Date,Customer_Since,Salesman_EID
0,1000.0,Howard,Tommy,M,42,97199,Basic,2023-01-12,2008-01-13,70045
1,1001.0,Vásquez,Sean,M,28,97373,Platinum,2023-09-12,2009-11-23,367032
2,1002.0,Clark,Jayce,M,70,97147,Basic,2023-02-06,2021-02-09,362455
3,1003.0,Rodríguez,Aria,F,19,97410,Gold,2022-05-28,2011-03-10,821007
4,1004.0,Muñoz,Claude,M,33,97360,Basic,2023-05-30,2011-08-17,208762


In [2]:
print('Number of Customers:', len(data),'\n') #Number of rows in data set

#Print number of values for each column
for column in data.columns.tolist():
    print(column,':',data.loc[:, column].count())

Number of Customers: 36806 

Customer_ID : 36764
Last_Name : 36806
First_Name : 36806
Sex : 36806
Age : 36806
ZIP : 36806
Plan : 36806
Plan_Start_Date : 36806
Customer_Since : 36806
Salesman_EID : 36806


In [3]:
#Table data in hash table/dictionary format
my_dict = data.iloc[:2, :].to_dict(orient='dict')
my_dict

{'Customer_ID': {0: 1000.0, 1: 1001.0},
 'Last_Name': {0: 'Howard', 1: 'Vásquez'},
 'First_Name': {0: 'Tommy', 1: 'Sean'},
 'Sex': {0: 'M', 1: 'M'},
 'Age': {0: 42, 1: 28},
 'ZIP': {0: 97199, 1: 97373},
 'Plan': {0: 'Basic', 1: 'Platinum'},
 'Plan_Start_Date': {0: '2023-01-12', 1: '2023-09-12'},
 'Customer_Since': {0: '2008-01-13', 1: '2009-11-23'},
 'Salesman_EID': {0: 70045, 1: 367032}}

In [4]:
def check_data_types(dataframe):
    data_types = [] #List to hold results
    for col in dataframe.columns.tolist(): #Loop through each column
        data_type_set = set() #Set to remove duplicates
        for idx in dataframe.index.tolist(): #In each column, loop through each row
            data_type_set.add(type(dataframe.loc[idx, col])) #Add data type of each row item
        data_types.append([col, data_type_set]) #Add results of loop to final list

    return pd.DataFrame(data_types, columns=['Column','Data_Types'])

check_data_types(data) #Execute function

Unnamed: 0,Column,Data_Types
0,Customer_ID,{<class 'numpy.float64'>}
1,Last_Name,{<class 'str'>}
2,First_Name,{<class 'str'>}
3,Sex,{<class 'str'>}
4,Age,{<class 'numpy.int64'>}
5,ZIP,{<class 'numpy.int64'>}
6,Plan,{<class 'str'>}
7,Plan_Start_Date,{<class 'str'>}
8,Customer_Since,{<class 'str'>}
9,Salesman_EID,{<class 'numpy.int64'>}


In [5]:
#Check to see how long the full loop takes
%timeit check_data_types(data)

4.79 s ± 57.4 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)


In [6]:
def quick_dt_chk(dataframe):
    for col in dataframe.columns.tolist():
        try:
            print(f'Sum of {col}:',sum(dataframe.loc[:,col]))
        except:
            print(f'No summable data types in {col}.')
            
quick_dt_chk(data)

Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509


In [7]:
#Check to see how long the sum loop takes
%timeit quick_dt_chk(data)

Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summ

Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP:

Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summ

Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 1823854350

Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summa

Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP:

Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summ

Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summ

Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summ

Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summa

Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summ

Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 1823854350

Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summa

Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summa

Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP:

Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP:

Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summa

Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 1823854350

Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summa

Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summ

Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP:

Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP:

Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 1823854350

Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 1823854350

Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summa

Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 18238543509
Sum of Customer_ID: nan
No summable data types in Last_Name.
No summable data types in First_Name.
No summable data types in Sex.
Sum of Age: 1753627
Sum of ZIP: 3580885928
No summable data types in Plan.
No summable data types in Plan_Start_Date.
No summable data types in Customer_Since.
Sum of Salesman_EID: 1823854350

In [8]:
#Full loop vs. quick sum
5/0.0168

297.61904761904765

In [9]:
#Adding string values to categorical columns with missing values
new_cids = data.loc[:,['Customer_ID']].fillna('MISSING') #Fill NaNs
data['Customer_ID'] = new_cids #Assign new string values to existing DataFrame
df_missing = data.query('Customer_ID == "MISSING"') #Filter by MISSING
df_missing.head()

Unnamed: 0,Customer_ID,Last_Name,First_Name,Sex,Age,ZIP,Plan,Plan_Start_Date,Customer_Since,Salesman_EID
36714,MISSING,López,Tommy,M,27,97199,Basic,2023-02-18,2009-10-18,594587
36715,MISSING,Wright,Sean,M,23,97373,Platinum,2022-02-14,2004-05-19,893970
36716,MISSING,Young,Jayce,M,42,97147,Platinum,2023-08-29,2016-12-22,335090
36717,MISSING,Torres,Aria,F,67,97410,Basic,2023-05-05,2023-08-24,133196
36718,MISSING,Sanders,Claude,M,23,97360,Gold,2022-03-21,2012-10-20,501466


In [10]:
#Removing duplicates
data.drop_duplicates(inplace=True)
len(data)

36756

In [11]:
#Difference between initial number and number without duplicates
36806 - 36756

50