In [2]:
# Dependencies
import pandas as pd
from pathlib import Path

In [4]:
# Path to the appliance CSV, relative to the notebook's working directory
appliances_file = Path("../Resources/dga_lpg.csv")

# Read the CSV into a DataFrame, then preview its first five rows
appliances_df = pd.read_csv(filepath_or_buffer=appliances_file)
appliances_df.head(n=5)

Unnamed: 0,Part,Type,Type.1,Brand,牌子,Model,Other Information,其他資料,Place of Manufacture,製造地點,Applicant,申請人,Telephone Number,Approval Expiry Date
0,Part 1 – Approved Domestic Gas Cooking Appliances,Built-in Hotplate 1 Burner,嵌入式單頭平面爐,De Dietrich,,DTG1288XC,CERAMIC GLASS TOP PANEL,陶瓷玻璃面版,Italy,意大利,Gilman Group Limited,太平洋行國際有限公司,2418 3272,2023-09-26
1,Part 1 – Approved Domestic Gas Cooking Appliances,Built-in Hotplate 1 Burner,嵌入式單頭平面爐,Electrolux,伊萊克斯,EGC-2901,CERAMIC GLASS TOP PANEL,陶瓷玻璃面版,The People's Republic of China,中華人民共和國,"Dah Chong Hong, Ltd.",大昌貿易行有限公司,2262 1690,2024-06-24
2,Part 1 – Approved Domestic Gas Cooking Appliances,Built-in Hotplate 1 Burner,嵌入式單頭平面爐,Gaggenau,,VG231120F,STAINLESS STEEL TOP PANEL,不銹鋼面版,France,法國,Kitchen Infinity Corp. Ltd.,Kitchen Infinity Corp. Ltd.,2552 2208,2024-04-01
3,Part 1 – Approved Domestic Gas Cooking Appliances,Built-in Hotplate 1 Burner,嵌入式單頭平面爐,Gaggenau,,VG231114F,STAINLESS STEEL TOP PANEL,不銹鋼面版,France,法國,Kitchen Infinity Corp. Ltd.,Kitchen Infinity Corp. Ltd.,2552 2208,2022-07-19
4,Part 1 – Approved Domestic Gas Cooking Appliances,Built-in Hotplate 1 Burner,嵌入式單頭平面爐,GERMAN POOL,德國寶,GP12-1-LG,GLASS TOP PANEL,玻璃面版,The People's Republic of China,中華人民共和國,German Pool (Hong Kong) Ltd.,德國寶（香港）有限公司,2773 2812,2025-02-15


In [5]:
# Keep only the English-language columns; the Chinese-language counterparts
# and the duplicated "Type.1" column are left out of the selection.
english_columns = [
    "Part",
    "Type",
    "Brand",
    "Model",
    "Other Information",
    "Place of Manufacture",
    "Applicant",
    "Telephone Number",
    "Approval Expiry Date",
]
appliances_clean_df = appliances_df[english_columns]

# Preview the reduced frame
appliances_clean_df.head()

Unnamed: 0,Part,Type,Brand,Model,Other Information,Place of Manufacture,Applicant,Telephone Number,Approval Expiry Date
0,Part 1 – Approved Domestic Gas Cooking Appliances,Built-in Hotplate 1 Burner,De Dietrich,DTG1288XC,CERAMIC GLASS TOP PANEL,Italy,Gilman Group Limited,2418 3272,2023-09-26
1,Part 1 – Approved Domestic Gas Cooking Appliances,Built-in Hotplate 1 Burner,Electrolux,EGC-2901,CERAMIC GLASS TOP PANEL,The People's Republic of China,"Dah Chong Hong, Ltd.",2262 1690,2024-06-24
2,Part 1 – Approved Domestic Gas Cooking Appliances,Built-in Hotplate 1 Burner,Gaggenau,VG231120F,STAINLESS STEEL TOP PANEL,France,Kitchen Infinity Corp. Ltd.,2552 2208,2024-04-01
3,Part 1 – Approved Domestic Gas Cooking Appliances,Built-in Hotplate 1 Burner,Gaggenau,VG231114F,STAINLESS STEEL TOP PANEL,France,Kitchen Infinity Corp. Ltd.,2552 2208,2022-07-19
4,Part 1 – Approved Domestic Gas Cooking Appliances,Built-in Hotplate 1 Burner,GERMAN POOL,GP12-1-LG,GLASS TOP PANEL,The People's Republic of China,German Pool (Hong Kong) Ltd.,2773 2812,2025-02-15


In [6]:
# Tally the non-missing entries in each column; a column whose tally is
# lower than the others contains missing values.
appliances_clean_df.notna().sum()

Part                    939
Type                    939
Brand                   939
Model                   939
Other Information       936
Place of Manufacture    939
Applicant               939
Telephone Number        939
Approval Expiry Date    939
dtype: int64

In [7]:
# Discard every row that has a missing value in at least one column
nonull_app_df = appliances_clean_df.dropna(axis="index", how="any")

In [8]:
# Confirm the drop worked: every column should now report the same
# number of non-missing entries.
nonull_app_df.notna().sum()

Part                    936
Type                    936
Brand                   936
Model                   936
Other Information       936
Place of Manufacture    936
Applicant               936
Telephone Number        936
Approval Expiry Date    936
dtype: int64

In [10]:
# Show each distinct "Applicant" value once so that near-duplicate
# spellings of the same applicant can be spotted by eye.
applicant_names = nonull_app_df["Applicant"]
applicant_names.unique()

array(['Gilman Group Limited', 'Dah Chong Hong, Ltd.',
       'Kitchen Infinity Corp. Ltd.', 'German Pool (Hong Kong) Ltd.',
       'World Engineering Limited', 'Hibachi Gas Cooker Limited',
       'Whirlpool (Hong Kong) Ltd.', 'Miele (Hong Kong) Limited',
       'Dong Woo Industrial Co. Ltd.', 'BSH Home Appliances Ltd.',
       'The Union Gas Appliances (Holdings) Ltd.',
       'Whampo Trading Limited', 'Sunny Eternal Limited',
       'Toptech Co. Limited', 'D & A Electronics Co., Ltd.',
       'Fidelity (Far East) Trading Co., Ltd.',
       'Araytron Technology Limited', 'Charm Vantage Limited',
       'Lighting Gas Stoves Trading Ltd', 'Lighting (Japan) Trading Ltd.',
       'Homepro International Limited',
       'The Hong Kong & China Gas Co., Ltd.',
       'Energy Trading Company Limited',
       'Wealthy Link International Trading Limited',
       'Wetol Company Limited',
       'Crown Gas Stoves (Holdings) Company Limited',
       'Iwatani Corporation (Hong Kong) Limited',
    

In [12]:
# Combine similar applicants together.
# Each key is a variant spelling and each value is the name it is merged into.
applicant_aliases = {
    "Crown Gas Stoves (Holdings) Company Limited": "Crown Gas Stoves Co., Ltd.",
    "Sun Kee LP Gas Co.": "Sun Kee LP Gas Co. Limited",
}

# Nest the mapping under "Applicant" so that only that column is rewritten.
# A flat mapping passed to DataFrame.replace is applied to every column, so a
# matching value in any other column would be changed as well.
nonull_app_df = nonull_app_df.replace({"Applicant": applicant_aliases})

nonull_app_df.head()

Unnamed: 0,Part,Type,Brand,Model,Other Information,Place of Manufacture,Applicant,Telephone Number,Approval Expiry Date
0,Part 1 – Approved Domestic Gas Cooking Appliances,Built-in Hotplate 1 Burner,De Dietrich,DTG1288XC,CERAMIC GLASS TOP PANEL,Italy,Gilman Group Limited,2418 3272,2023-09-26
1,Part 1 – Approved Domestic Gas Cooking Appliances,Built-in Hotplate 1 Burner,Electrolux,EGC-2901,CERAMIC GLASS TOP PANEL,The People's Republic of China,"Dah Chong Hong, Ltd.",2262 1690,2024-06-24
2,Part 1 – Approved Domestic Gas Cooking Appliances,Built-in Hotplate 1 Burner,Gaggenau,VG231120F,STAINLESS STEEL TOP PANEL,France,Kitchen Infinity Corp. Ltd.,2552 2208,2024-04-01
3,Part 1 – Approved Domestic Gas Cooking Appliances,Built-in Hotplate 1 Burner,Gaggenau,VG231114F,STAINLESS STEEL TOP PANEL,France,Kitchen Infinity Corp. Ltd.,2552 2208,2022-07-19
4,Part 1 – Approved Domestic Gas Cooking Appliances,Built-in Hotplate 1 Burner,GERMAN POOL,GP12-1-LG,GLASS TOP PANEL,The People's Republic of China,German Pool (Hong Kong) Ltd.,2773 2812,2025-02-15


In [None]:
# Check to see if you combined similar applicants correctly in "Applicant"


In [None]:
# Create a new DataFrame that looks into a specific Place of Manufacture


In [None]:
# Create a new DataFrame that looks into a specific Place of Manufacture
