# Games

This notebook documents the ETL process applied to a data file from the Steam video game platform. The file describes the products available on Steam, with fields such as publisher, name, release date, and tags.

In [31]:
import pandas as pd
import numpy as np
import ast
from etl_functions import general_information, get_year, column_comparator, explode_column

In [10]:
# Load the raw catalogue; lines=True tells pandas the file holds one JSON object per line.
df_games = pd.read_json("data/output_steam_games.json", lines=True)

In [11]:
df_games.head(5)

Unnamed: 0,publisher,genres,app_name,title,url,release_date,tags,reviews_url,specs,price,early_access,id,developer
0,,,,,,,,,,,,,
1,,,,,,,,,,,,,
2,,,,,,,,,,,,,
3,,,,,,,,,,,,,
4,,,,,,,,,,,,,


In [12]:
df_games.tail(5)

Unnamed: 0,publisher,genres,app_name,title,url,release_date,tags,reviews_url,specs,price,early_access,id,developer
120440,Ghost_RUS Games,"[Casual, Indie, Simulation, Strategy]",Colony On Mars,Colony On Mars,http://store.steampowered.com/app/773640/Colon...,2018-01-04,"[Strategy, Indie, Casual, Simulation]",http://steamcommunity.com/app/773640/reviews/?...,"[Single-player, Steam Achievements]",1.99,0.0,773640.0,"Nikita ""Ghost_RUS"""
120441,Sacada,"[Casual, Indie, Strategy]",LOGistICAL: South Africa,LOGistICAL: South Africa,http://store.steampowered.com/app/733530/LOGis...,2018-01-04,"[Strategy, Indie, Casual]",http://steamcommunity.com/app/733530/reviews/?...,"[Single-player, Steam Achievements, Steam Clou...",4.99,0.0,733530.0,Sacada
120442,Laush Studio,"[Indie, Racing, Simulation]",Russian Roads,Russian Roads,http://store.steampowered.com/app/610660/Russi...,2018-01-04,"[Indie, Simulation, Racing]",http://steamcommunity.com/app/610660/reviews/?...,"[Single-player, Steam Achievements, Steam Trad...",1.99,0.0,610660.0,Laush Dmitriy Sergeevich
120443,SIXNAILS,"[Casual, Indie]",EXIT 2 - Directions,EXIT 2 - Directions,http://store.steampowered.com/app/658870/EXIT_...,2017-09-02,"[Indie, Casual, Puzzle, Singleplayer, Atmosphe...",http://steamcommunity.com/app/658870/reviews/?...,"[Single-player, Steam Achievements, Steam Cloud]",4.99,0.0,658870.0,"xropi,stev3ns"
120444,,,Maze Run VR,,http://store.steampowered.com/app/681550/Maze_...,,"[Early Access, Adventure, Indie, Action, Simul...",http://steamcommunity.com/app/681550/reviews/?...,"[Single-player, Stats, Steam Leaderboards, HTC...",4.99,1.0,681550.0,


In [13]:
df_games.shape

(120445, 13)

In [14]:
general_information(df_games)

Unnamed: 0,column,data_type,missing_values,missing_values_percentage
0,publisher,<class 'str'>,192724,1.6
1,genres,<class 'str'>,183186,1.52
2,app_name,<class 'str'>,176624,1.47
3,title,<class 'str'>,180720,1.5
4,url,<class 'str'>,176620,1.47
5,release_date,<class 'str'>,180754,1.5
6,tags,<class 'str'>,176946,1.47
7,reviews_url,<class 'str'>,176624,1.47
8,specs,<class 'str'>,177960,1.48
9,price,<class 'str'>,179374,1.49


In [15]:
# Discard every row that has at least one missing value and renumber the index from 0.
# This removes the fully empty rows as well as partially filled ones.
df_games = df_games.dropna(how="any", ignore_index=True)

In [16]:
general_information(df_games)

Unnamed: 0,column,data_type,missing_values,missing_values_percentage
0,publisher,<class 'str'>,0,0.0
1,genres,<class 'str'>,0,0.0
2,app_name,<class 'str'>,0,0.0
3,title,<class 'str'>,0,0.0
4,url,<class 'str'>,0,0.0
5,release_date,<class 'str'>,0,0.0
6,tags,<class 'str'>,0,0.0
7,reviews_url,<class 'str'>,0,0.0
8,specs,<class 'str'>,0,0.0
9,price,<class 'str'>,0,0.0


In [17]:
df_games.head(5)

Unnamed: 0,publisher,genres,app_name,title,url,release_date,tags,reviews_url,specs,price,early_access,id,developer
0,Kotoshiro,"[Action, Casual, Indie, Simulation, Strategy]",Lost Summoner Kitty,Lost Summoner Kitty,http://store.steampowered.com/app/761140/Lost_...,2018-01-04,"[Strategy, Action, Indie, Casual, Simulation]",http://steamcommunity.com/app/761140/reviews/?...,[Single-player],4.99,0.0,761140.0,Kotoshiro
1,"Making Fun, Inc.","[Free to Play, Indie, RPG, Strategy]",Ironbound,Ironbound,http://store.steampowered.com/app/643980/Ironb...,2018-01-04,"[Free to Play, Strategy, Indie, RPG, Card Game...",http://steamcommunity.com/app/643980/reviews/?...,"[Single-player, Multi-player, Online Multi-Pla...",Free To Play,0.0,643980.0,Secret Level SRL
2,Poolians.com,"[Casual, Free to Play, Indie, Simulation, Sports]",Real Pool 3D - Poolians,Real Pool 3D - Poolians,http://store.steampowered.com/app/670290/Real_...,2017-07-24,"[Free to Play, Simulation, Sports, Casual, Ind...",http://steamcommunity.com/app/670290/reviews/?...,"[Single-player, Multi-player, Online Multi-Pla...",Free to Play,0.0,670290.0,Poolians.com
3,彼岸领域,"[Action, Adventure, Casual]",弹炸人2222,弹炸人2222,http://store.steampowered.com/app/767400/2222/,2017-12-07,"[Action, Adventure, Casual]",http://steamcommunity.com/app/767400/reviews/?...,[Single-player],0.99,0.0,767400.0,彼岸领域
4,Trickjump Games Ltd,"[Action, Adventure, Simulation]",Battle Royale Trainer,Battle Royale Trainer,http://store.steampowered.com/app/772540/Battl...,2018-01-04,"[Action, Adventure, Simulation, FPS, Shooter, ...",http://steamcommunity.com/app/772540/reviews/?...,"[Single-player, Steam Achievements]",3.99,0.0,772540.0,Trickjump Games Ltd


In [18]:
# Remove the two URL columns from the table.
df_games = df_games.drop(columns=["url", "reviews_url"])

In [19]:
df_games.head(5)

Unnamed: 0,publisher,genres,app_name,title,release_date,tags,specs,price,early_access,id,developer
0,Kotoshiro,"[Action, Casual, Indie, Simulation, Strategy]",Lost Summoner Kitty,Lost Summoner Kitty,2018-01-04,"[Strategy, Action, Indie, Casual, Simulation]",[Single-player],4.99,0.0,761140.0,Kotoshiro
1,"Making Fun, Inc.","[Free to Play, Indie, RPG, Strategy]",Ironbound,Ironbound,2018-01-04,"[Free to Play, Strategy, Indie, RPG, Card Game...","[Single-player, Multi-player, Online Multi-Pla...",Free To Play,0.0,643980.0,Secret Level SRL
2,Poolians.com,"[Casual, Free to Play, Indie, Simulation, Sports]",Real Pool 3D - Poolians,Real Pool 3D - Poolians,2017-07-24,"[Free to Play, Simulation, Sports, Casual, Ind...","[Single-player, Multi-player, Online Multi-Pla...",Free to Play,0.0,670290.0,Poolians.com
3,彼岸领域,"[Action, Adventure, Casual]",弹炸人2222,弹炸人2222,2017-12-07,"[Action, Adventure, Casual]",[Single-player],0.99,0.0,767400.0,彼岸领域
4,Trickjump Games Ltd,"[Action, Adventure, Simulation]",Battle Royale Trainer,Battle Royale Trainer,2018-01-04,"[Action, Adventure, Simulation, FPS, Shooter, ...","[Single-player, Steam Achievements]",3.99,0.0,772540.0,Trickjump Games Ltd


In [20]:
column_comparator(df_games,"app_name","title")

'The percentage of common values for the columns app_name and title is 98.44%'

In [21]:
# column_comparator reported 98.44% common values between app_name and title,
# so only app_name is kept.
df_games = df_games.drop(columns=["title"])

In [22]:
df_games.head(5)

Unnamed: 0,publisher,genres,app_name,release_date,tags,specs,price,early_access,id,developer
0,Kotoshiro,"[Action, Casual, Indie, Simulation, Strategy]",Lost Summoner Kitty,2018-01-04,"[Strategy, Action, Indie, Casual, Simulation]",[Single-player],4.99,0.0,761140.0,Kotoshiro
1,"Making Fun, Inc.","[Free to Play, Indie, RPG, Strategy]",Ironbound,2018-01-04,"[Free to Play, Strategy, Indie, RPG, Card Game...","[Single-player, Multi-player, Online Multi-Pla...",Free To Play,0.0,643980.0,Secret Level SRL
2,Poolians.com,"[Casual, Free to Play, Indie, Simulation, Sports]",Real Pool 3D - Poolians,2017-07-24,"[Free to Play, Simulation, Sports, Casual, Ind...","[Single-player, Multi-player, Online Multi-Pla...",Free to Play,0.0,670290.0,Poolians.com
3,彼岸领域,"[Action, Adventure, Casual]",弹炸人2222,2017-12-07,"[Action, Adventure, Casual]",[Single-player],0.99,0.0,767400.0,彼岸领域
4,Trickjump Games Ltd,"[Action, Adventure, Simulation]",Battle Royale Trainer,2018-01-04,"[Action, Adventure, Simulation, FPS, Shooter, ...","[Single-player, Steam Achievements]",3.99,0.0,772540.0,Trickjump Games Ltd


In [23]:
column_comparator(df_games,"genres","tags")

'The percentage of common values for the columns genres and tags is 22.21%'

In [24]:
column_comparator(df_games,"tags","specs")

'The percentage of common values for the columns tags and specs is 0.0%'

In [25]:
column_comparator(df_games,"publisher","developer")

'The percentage of common values for the columns publisher and developer is 51.17%'

In [26]:
# Give the identifier column the name item_id.
df_games = df_games.rename(columns={"id": "item_id"})

In [27]:
df_games.head(5)

Unnamed: 0,publisher,genres,app_name,release_date,tags,specs,price,early_access,item_id,developer
0,Kotoshiro,"[Action, Casual, Indie, Simulation, Strategy]",Lost Summoner Kitty,2018-01-04,"[Strategy, Action, Indie, Casual, Simulation]",[Single-player],4.99,0.0,761140.0,Kotoshiro
1,"Making Fun, Inc.","[Free to Play, Indie, RPG, Strategy]",Ironbound,2018-01-04,"[Free to Play, Strategy, Indie, RPG, Card Game...","[Single-player, Multi-player, Online Multi-Pla...",Free To Play,0.0,643980.0,Secret Level SRL
2,Poolians.com,"[Casual, Free to Play, Indie, Simulation, Sports]",Real Pool 3D - Poolians,2017-07-24,"[Free to Play, Simulation, Sports, Casual, Ind...","[Single-player, Multi-player, Online Multi-Pla...",Free to Play,0.0,670290.0,Poolians.com
3,彼岸领域,"[Action, Adventure, Casual]",弹炸人2222,2017-12-07,"[Action, Adventure, Casual]",[Single-player],0.99,0.0,767400.0,彼岸领域
4,Trickjump Games Ltd,"[Action, Adventure, Simulation]",Battle Royale Trainer,2018-01-04,"[Action, Adventure, Simulation, FPS, Shooter, ...","[Single-player, Steam Achievements]",3.99,0.0,772540.0,Trickjump Games Ltd


In [28]:
# Identifiers were parsed as floats (e.g. 761140.0); store them as 64-bit integers.
df_games = df_games.astype({"item_id": "int64"})

In [29]:
df_games.head(5)

Unnamed: 0,publisher,genres,app_name,release_date,tags,specs,price,early_access,item_id,developer
0,Kotoshiro,"[Action, Casual, Indie, Simulation, Strategy]",Lost Summoner Kitty,2018-01-04,"[Strategy, Action, Indie, Casual, Simulation]",[Single-player],4.99,0.0,761140,Kotoshiro
1,"Making Fun, Inc.","[Free to Play, Indie, RPG, Strategy]",Ironbound,2018-01-04,"[Free to Play, Strategy, Indie, RPG, Card Game...","[Single-player, Multi-player, Online Multi-Pla...",Free To Play,0.0,643980,Secret Level SRL
2,Poolians.com,"[Casual, Free to Play, Indie, Simulation, Sports]",Real Pool 3D - Poolians,2017-07-24,"[Free to Play, Simulation, Sports, Casual, Ind...","[Single-player, Multi-player, Online Multi-Pla...",Free to Play,0.0,670290,Poolians.com
3,彼岸领域,"[Action, Adventure, Casual]",弹炸人2222,2017-12-07,"[Action, Adventure, Casual]",[Single-player],0.99,0.0,767400,彼岸领域
4,Trickjump Games Ltd,"[Action, Adventure, Simulation]",Battle Royale Trainer,2018-01-04,"[Action, Adventure, Simulation, FPS, Shooter, ...","[Single-player, Steam Achievements]",3.99,0.0,772540,Trickjump Games Ltd


In [34]:
# Replace each release date with whatever get_year returns for it; the notebook
# output shows values such as 2018-01-04 becoming 2018.
# NOTE(review): get_year lives in etl_functions; how it treats malformed dates is not visible here — confirm.
df_games["release_date"]=df_games["release_date"].apply(get_year)

In [35]:
df_games.head(5)

Unnamed: 0,publisher,genres,app_name,release_date,tags,specs,price,early_access,item_id,developer
0,Kotoshiro,"[Action, Casual, Indie, Simulation, Strategy]",Lost Summoner Kitty,2018,"[Strategy, Action, Indie, Casual, Simulation]",[Single-player],4.99,0.0,761140,Kotoshiro
1,"Making Fun, Inc.","[Free to Play, Indie, RPG, Strategy]",Ironbound,2018,"[Free to Play, Strategy, Indie, RPG, Card Game...","[Single-player, Multi-player, Online Multi-Pla...",Free To Play,0.0,643980,Secret Level SRL
2,Poolians.com,"[Casual, Free to Play, Indie, Simulation, Sports]",Real Pool 3D - Poolians,2017,"[Free to Play, Simulation, Sports, Casual, Ind...","[Single-player, Multi-player, Online Multi-Pla...",Free to Play,0.0,670290,Poolians.com
3,彼岸领域,"[Action, Adventure, Casual]",弹炸人2222,2017,"[Action, Adventure, Casual]",[Single-player],0.99,0.0,767400,彼岸领域
4,Trickjump Games Ltd,"[Action, Adventure, Simulation]",Battle Royale Trainer,2018,"[Action, Adventure, Simulation, FPS, Shooter, ...","[Single-player, Steam Achievements]",3.99,0.0,772540,Trickjump Games Ltd


In [36]:
# The column now holds only the year, so rename it to match its content.
df_games = df_games.rename(columns={"release_date": "release_year"})

In [37]:
df_games.head(5)

Unnamed: 0,publisher,genres,app_name,release_year,tags,specs,price,early_access,item_id,developer
0,Kotoshiro,"[Action, Casual, Indie, Simulation, Strategy]",Lost Summoner Kitty,2018,"[Strategy, Action, Indie, Casual, Simulation]",[Single-player],4.99,0.0,761140,Kotoshiro
1,"Making Fun, Inc.","[Free to Play, Indie, RPG, Strategy]",Ironbound,2018,"[Free to Play, Strategy, Indie, RPG, Card Game...","[Single-player, Multi-player, Online Multi-Pla...",Free To Play,0.0,643980,Secret Level SRL
2,Poolians.com,"[Casual, Free to Play, Indie, Simulation, Sports]",Real Pool 3D - Poolians,2017,"[Free to Play, Simulation, Sports, Casual, Ind...","[Single-player, Multi-player, Online Multi-Pla...",Free to Play,0.0,670290,Poolians.com
3,彼岸领域,"[Action, Adventure, Casual]",弹炸人2222,2017,"[Action, Adventure, Casual]",[Single-player],0.99,0.0,767400,彼岸领域
4,Trickjump Games Ltd,"[Action, Adventure, Simulation]",Battle Royale Trainer,2018,"[Action, Adventure, Simulation, FPS, Shooter, ...","[Single-player, Steam Achievements]",3.99,0.0,772540,Trickjump Games Ltd


In [38]:
# early_access was parsed as floats (0.0 / 1.0); store it as 64-bit integers.
df_games = df_games.astype({"early_access": "int64"})

In [39]:
df_games.head(5)

Unnamed: 0,publisher,genres,app_name,release_year,tags,specs,price,early_access,item_id,developer
0,Kotoshiro,"[Action, Casual, Indie, Simulation, Strategy]",Lost Summoner Kitty,2018,"[Strategy, Action, Indie, Casual, Simulation]",[Single-player],4.99,0,761140,Kotoshiro
1,"Making Fun, Inc.","[Free to Play, Indie, RPG, Strategy]",Ironbound,2018,"[Free to Play, Strategy, Indie, RPG, Card Game...","[Single-player, Multi-player, Online Multi-Pla...",Free To Play,0,643980,Secret Level SRL
2,Poolians.com,"[Casual, Free to Play, Indie, Simulation, Sports]",Real Pool 3D - Poolians,2017,"[Free to Play, Simulation, Sports, Casual, Ind...","[Single-player, Multi-player, Online Multi-Pla...",Free to Play,0,670290,Poolians.com
3,彼岸领域,"[Action, Adventure, Casual]",弹炸人2222,2017,"[Action, Adventure, Casual]",[Single-player],0.99,0,767400,彼岸领域
4,Trickjump Games Ltd,"[Action, Adventure, Simulation]",Battle Royale Trainer,2018,"[Action, Adventure, Simulation, FPS, Shooter, ...","[Single-player, Steam Achievements]",3.99,0,772540,Trickjump Games Ltd


In [40]:
df_games["price"].unique()

array([4.99, 'Free To Play', 'Free to Play', 0.99, 3.99, 18.99, 29.99,
       10.99, 2.99, 1.5899999999999999, 14.99, 1.99, 59.99, 9.99, 6.99,
       7.99, 39.99, 'Free', 19.99, 7.49, 8.99, 12.99, 5.99, 2.49, 15.99,
       1.25, 24.99, 17.99, 61.99, 3.49, 11.99, 13.99, 'Free Demo',
       'Play for Free!', 34.99, 1.49, 32.99, 99.99, 14.95, 69.99, 16.99,
       79.99, 49.99, 13.98, 149.99, 771.71, 'Install Now', 21.99, 89.99,
       'Play WARMACHINE: Tactics Demo', 0.98, 139.92, 4.29, 'Free Mod',
       54.99, 64.99, 74.99, 0.89, 0.5, 'Play Now', 299.99, 1.29, 119.99,
       44.99, 3.0, 15.0, 1.3900000000000001, 'Free HITMAN™ Holiday Pack',
       2.0, 4.0, 1.9500000000000002, 1.5, 6.66, 26.99, 399.99, 31.99,
       20.0, 40.0, 5.0, 3.33, 38.85, 71.7, 995.0, 5.49, 27.49, 3.39, 6.0,
       19.95, 20.99, 499.99, 27.99, 199.99, 4.68, 131.4, 44.98, 202.76,
       2.3, 0.9500000000000001, 36.99, 172.24, 249.99, 2.9699999999999998,
       10.96, 2.66, 6.48, 10.0, 1.0, 11.15, 'Play the Demo', 

In [41]:
# price mixes floats and text labels, so cast everything to str before editing.
# Literal match: the "Free to Play" label becomes a price of 0.
df_games["price"] = df_games["price"].astype(str).str.replace("Free to Play", "0", regex=False)

In [42]:
df_games.head(5)

Unnamed: 0,publisher,genres,app_name,release_year,tags,specs,price,early_access,item_id,developer
0,Kotoshiro,"[Action, Casual, Indie, Simulation, Strategy]",Lost Summoner Kitty,2018,"[Strategy, Action, Indie, Casual, Simulation]",[Single-player],4.99,0,761140,Kotoshiro
1,"Making Fun, Inc.","[Free to Play, Indie, RPG, Strategy]",Ironbound,2018,"[Free to Play, Strategy, Indie, RPG, Card Game...","[Single-player, Multi-player, Online Multi-Pla...",Free To Play,0,643980,Secret Level SRL
2,Poolians.com,"[Casual, Free to Play, Indie, Simulation, Sports]",Real Pool 3D - Poolians,2017,"[Free to Play, Simulation, Sports, Casual, Ind...","[Single-player, Multi-player, Online Multi-Pla...",0,0,670290,Poolians.com
3,彼岸领域,"[Action, Adventure, Casual]",弹炸人2222,2017,"[Action, Adventure, Casual]",[Single-player],0.99,0,767400,彼岸领域
4,Trickjump Games Ltd,"[Action, Adventure, Simulation]",Battle Royale Trainer,2018,"[Action, Adventure, Simulation, FPS, Shooter, ...","[Single-player, Steam Achievements]",3.99,0,772540,Trickjump Games Ltd


In [43]:
# Same as the previous label but with a capital "To": "Free To Play" becomes 0.
df_games["price"] = df_games["price"].astype(str).str.replace("Free To Play", "0", regex=False)

In [44]:
df_games.head(5)

Unnamed: 0,publisher,genres,app_name,release_year,tags,specs,price,early_access,item_id,developer
0,Kotoshiro,"[Action, Casual, Indie, Simulation, Strategy]",Lost Summoner Kitty,2018,"[Strategy, Action, Indie, Casual, Simulation]",[Single-player],4.99,0,761140,Kotoshiro
1,"Making Fun, Inc.","[Free to Play, Indie, RPG, Strategy]",Ironbound,2018,"[Free to Play, Strategy, Indie, RPG, Card Game...","[Single-player, Multi-player, Online Multi-Pla...",0.0,0,643980,Secret Level SRL
2,Poolians.com,"[Casual, Free to Play, Indie, Simulation, Sports]",Real Pool 3D - Poolians,2017,"[Free to Play, Simulation, Sports, Casual, Ind...","[Single-player, Multi-player, Online Multi-Pla...",0.0,0,670290,Poolians.com
3,彼岸领域,"[Action, Adventure, Casual]",弹炸人2222,2017,"[Action, Adventure, Casual]",[Single-player],0.99,0,767400,彼岸领域
4,Trickjump Games Ltd,"[Action, Adventure, Simulation]",Battle Royale Trainer,2018,"[Action, Adventure, Simulation, FPS, Shooter, ...","[Single-player, Steam Achievements]",3.99,0,772540,Trickjump Games Ltd


In [45]:
# Literal match: the "Play for Free!" label becomes a price of 0.
df_games["price"] = df_games["price"].astype(str).str.replace("Play for Free!", "0", regex=False)

In [46]:
# Literal match: any remaining "Free!" text becomes 0.
df_games["price"] = df_games["price"].astype(str).str.replace("Free!", "0", regex=False)

In [47]:
# Substring replacement: every occurrence of "Free" becomes "0". Plain "Free" turns into "0",
# while longer labels such as "Free Demo" turn into "0 Demo" and still need handling.
df_games["price"] = df_games["price"].astype(str).str.replace("Free", "0", regex=False)

In [48]:
# "Install Now" carries no price information; mark it with the placeholder string "None".
df_games["price"] = df_games["price"].astype(str).str.replace("Install Now", "None", regex=False)

In [49]:
# Demo label with no price information; mark it with the placeholder string "None".
df_games["price"] = df_games["price"].astype(str).str.replace(
    "Play WARMACHINE: Tactics Demo", "None", regex=False
)

In [50]:
# "0 Demo" is what "Free Demo" looks like once "Free" has been replaced by "0";
# mark it with the placeholder string "None".
df_games["price"] = df_games["price"].astype(str).str.replace("0 Demo", "None", regex=False)

In [51]:
# "0 HITMAN™ Holiday Pack" is the "Free HITMAN™ Holiday Pack" label after "Free" became "0";
# mark it with the placeholder string "None".
df_games["price"] = df_games["price"].astype(str).str.replace(
    "0 HITMAN™ Holiday Pack", "None", regex=False
)

In [52]:
# "Third-party" carries no price information; mark it with the placeholder string "None".
df_games["price"] = df_games["price"].astype(str).str.replace("Third-party", "None", regex=False)

In [53]:
# Repeats the earlier "Install Now" replacement; when the cells run in order nothing is left to match.
df_games["price"] = df_games["price"].astype(str).str.replace("Install Now", "None", regex=False)

In [54]:
# "Play the Demo" carries no price information; mark it with the placeholder string "None".
df_games["price"] = df_games["price"].astype(str).str.replace("Play the Demo", "None", regex=False)

In [55]:
# "0 Mod" is what "Free Mod" looks like once "Free" has been replaced by "0";
# mark it with the placeholder string "None".
df_games["price"] = df_games["price"].astype(str).str.replace("0 Mod", "None", regex=False)

In [56]:
# "Play Now" carries no price information; mark it with the placeholder string "None".
df_games["price"] = df_games["price"].astype(str).str.replace("Play Now", "None", regex=False)

In [57]:
df_games["price"].unique()

array(['4.99', '0', '0.99', '3.99', '18.99', '29.99', '10.99', '2.99',
       '1.5899999999999999', '14.99', '1.99', '59.99', '9.99', '6.99',
       '7.99', '39.99', '19.99', '7.49', '8.99', '12.99', '5.99', '2.49',
       '15.99', '1.25', '24.99', '17.99', '61.99', '3.49', '11.99',
       '13.99', 'None', '34.99', '1.49', '32.99', '99.99', '14.95',
       '69.99', '16.99', '79.99', '49.99', '13.98', '149.99', '771.71',
       '21.99', '89.99', '0.98', '139.92', '4.29', '54.99', '64.99',
       '74.99', '0.89', '0.5', '299.99', '1.29', '119.99', '44.99', '3.0',
       '15.0', '1.3900000000000001', '2.0', '4.0', '1.9500000000000002',
       '1.5', '6.66', '26.99', '399.99', '31.99', '20.0', '40.0', '5.0',
       '3.33', '38.85', '71.7', '995.0', '5.49', '27.49', '3.39', '6.0',
       '19.95', '20.99', '499.99', '27.99', '199.99', '4.68', '131.4',
       '44.98', '202.76', '2.3', '0.9500000000000001', '36.99', '172.24',
       '249.99', '2.9699999999999998', '10.96', '2.66', '6.48', '10.

In [58]:
# Turn the "None" placeholder strings into real missing values (NaN).
# The result is assigned back rather than calling an inplace method on the
# df_games["price"] selection: that chained inplace call raises a FutureWarning in
# pandas 2.2 and stops updating df_games once Copy-on-Write is enabled, which would
# leave the "None" strings in place and break the float conversion that follows.
df_games["price"] = df_games["price"].replace("None", np.nan)

In [59]:
df_games["price"].unique()

array(['4.99', '0', '0.99', '3.99', '18.99', '29.99', '10.99', '2.99',
       '1.5899999999999999', '14.99', '1.99', '59.99', '9.99', '6.99',
       '7.99', '39.99', '19.99', '7.49', '8.99', '12.99', '5.99', '2.49',
       '15.99', '1.25', '24.99', '17.99', '61.99', '3.49', '11.99',
       '13.99', nan, '34.99', '1.49', '32.99', '99.99', '14.95', '69.99',
       '16.99', '79.99', '49.99', '13.98', '149.99', '771.71', '21.99',
       '89.99', '0.98', '139.92', '4.29', '54.99', '64.99', '74.99',
       '0.89', '0.5', '299.99', '1.29', '119.99', '44.99', '3.0', '15.0',
       '1.3900000000000001', '2.0', '4.0', '1.9500000000000002', '1.5',
       '6.66', '26.99', '399.99', '31.99', '20.0', '40.0', '5.0', '3.33',
       '38.85', '71.7', '995.0', '5.49', '27.49', '3.39', '6.0', '19.95',
       '20.99', '499.99', '27.99', '199.99', '4.68', '131.4', '44.98',
       '202.76', '2.3', '0.9500000000000001', '36.99', '172.24', '249.99',
       '2.9699999999999998', '10.96', '2.66', '6.48', '10.0',

In [60]:
# price now holds numeric strings and NaN only; convert the column to 64-bit floats.
df_games = df_games.astype({"price": "float64"})

In [61]:
df_games["price"].unique()

array([4.9900e+00, 0.0000e+00, 9.9000e-01, 3.9900e+00, 1.8990e+01,
       2.9990e+01, 1.0990e+01, 2.9900e+00, 1.5900e+00, 1.4990e+01,
       1.9900e+00, 5.9990e+01, 9.9900e+00, 6.9900e+00, 7.9900e+00,
       3.9990e+01, 1.9990e+01, 7.4900e+00, 8.9900e+00, 1.2990e+01,
       5.9900e+00, 2.4900e+00, 1.5990e+01, 1.2500e+00, 2.4990e+01,
       1.7990e+01, 6.1990e+01, 3.4900e+00, 1.1990e+01, 1.3990e+01,
              nan, 3.4990e+01, 1.4900e+00, 3.2990e+01, 9.9990e+01,
       1.4950e+01, 6.9990e+01, 1.6990e+01, 7.9990e+01, 4.9990e+01,
       1.3980e+01, 1.4999e+02, 7.7171e+02, 2.1990e+01, 8.9990e+01,
       9.8000e-01, 1.3992e+02, 4.2900e+00, 5.4990e+01, 6.4990e+01,
       7.4990e+01, 8.9000e-01, 5.0000e-01, 2.9999e+02, 1.2900e+00,
       1.1999e+02, 4.4990e+01, 3.0000e+00, 1.5000e+01, 1.3900e+00,
       2.0000e+00, 4.0000e+00, 1.9500e+00, 1.5000e+00, 6.6600e+00,
       2.6990e+01, 3.9999e+02, 3.1990e+01, 2.0000e+01, 4.0000e+01,
       5.0000e+00, 3.3300e+00, 3.8850e+01, 7.1700e+01, 9.9500e

In [62]:
# Round to cents; this cleans up float artefacts such as 1.5899999999999999.
df_games["price"] = df_games["price"].round(decimals=2)

In [63]:
df_games.head(5)

Unnamed: 0,publisher,genres,app_name,release_year,tags,specs,price,early_access,item_id,developer
0,Kotoshiro,"[Action, Casual, Indie, Simulation, Strategy]",Lost Summoner Kitty,2018,"[Strategy, Action, Indie, Casual, Simulation]",[Single-player],4.99,0,761140,Kotoshiro
1,"Making Fun, Inc.","[Free to Play, Indie, RPG, Strategy]",Ironbound,2018,"[Free to Play, Strategy, Indie, RPG, Card Game...","[Single-player, Multi-player, Online Multi-Pla...",0.0,0,643980,Secret Level SRL
2,Poolians.com,"[Casual, Free to Play, Indie, Simulation, Sports]",Real Pool 3D - Poolians,2017,"[Free to Play, Simulation, Sports, Casual, Ind...","[Single-player, Multi-player, Online Multi-Pla...",0.0,0,670290,Poolians.com
3,彼岸领域,"[Action, Adventure, Casual]",弹炸人2222,2017,"[Action, Adventure, Casual]",[Single-player],0.99,0,767400,彼岸领域
4,Trickjump Games Ltd,"[Action, Adventure, Simulation]",Battle Royale Trainer,2018,"[Action, Adventure, Simulation, FPS, Shooter, ...","[Single-player, Steam Achievements]",3.99,0,772540,Trickjump Games Ltd


In [65]:
# Expand the genres list column so each genre gets its own row; the other
# columns are repeated on every resulting row (one game with 5 genres becomes 5 rows).
# NOTE(review): explode_column is defined in etl_functions; its handling of empty lists is not visible here — confirm.
df_games=explode_column(df_games,"genres")

In [66]:
df_games.head(5)

Unnamed: 0,publisher,genres,app_name,release_year,tags,specs,price,early_access,item_id,developer
0,Kotoshiro,Action,Lost Summoner Kitty,2018,"[Strategy, Action, Indie, Casual, Simulation]",[Single-player],4.99,0,761140,Kotoshiro
1,Kotoshiro,Casual,Lost Summoner Kitty,2018,"[Strategy, Action, Indie, Casual, Simulation]",[Single-player],4.99,0,761140,Kotoshiro
2,Kotoshiro,Indie,Lost Summoner Kitty,2018,"[Strategy, Action, Indie, Casual, Simulation]",[Single-player],4.99,0,761140,Kotoshiro
3,Kotoshiro,Simulation,Lost Summoner Kitty,2018,"[Strategy, Action, Indie, Casual, Simulation]",[Single-player],4.99,0,761140,Kotoshiro
4,Kotoshiro,Strategy,Lost Summoner Kitty,2018,"[Strategy, Action, Indie, Casual, Simulation]",[Single-player],4.99,0,761140,Kotoshiro


In [67]:
# Expand the tags list column so each tag gets its own row.
# Because genres was expanded first, every genre row is repeated once per tag,
# so a game ends up with one row per (genre, tag) combination.
df_games=explode_column(df_games,"tags")

In [68]:
df_games.head(5)

Unnamed: 0,publisher,genres,app_name,release_year,tags,specs,price,early_access,item_id,developer
0,Kotoshiro,Action,Lost Summoner Kitty,2018,Strategy,[Single-player],4.99,0,761140,Kotoshiro
1,Kotoshiro,Action,Lost Summoner Kitty,2018,Action,[Single-player],4.99,0,761140,Kotoshiro
2,Kotoshiro,Action,Lost Summoner Kitty,2018,Indie,[Single-player],4.99,0,761140,Kotoshiro
3,Kotoshiro,Action,Lost Summoner Kitty,2018,Casual,[Single-player],4.99,0,761140,Kotoshiro
4,Kotoshiro,Action,Lost Summoner Kitty,2018,Simulation,[Single-player],4.99,0,761140,Kotoshiro


In [69]:
# Expand the specs list column so each spec gets its own row.
# NOTE(review): after three successive expansions the row count per game is presumably
# genres x tags x specs — confirm this size is acceptable for the output file.
df_games=explode_column(df_games,"specs")

In [70]:
df_games.head(5)

Unnamed: 0,publisher,genres,app_name,release_year,tags,specs,price,early_access,item_id,developer
0,Kotoshiro,Action,Lost Summoner Kitty,2018,Strategy,Single-player,4.99,0,761140,Kotoshiro
1,Kotoshiro,Action,Lost Summoner Kitty,2018,Action,Single-player,4.99,0,761140,Kotoshiro
2,Kotoshiro,Action,Lost Summoner Kitty,2018,Indie,Single-player,4.99,0,761140,Kotoshiro
3,Kotoshiro,Action,Lost Summoner Kitty,2018,Casual,Single-player,4.99,0,761140,Kotoshiro
4,Kotoshiro,Action,Lost Summoner Kitty,2018,Simulation,Single-player,4.99,0,761140,Kotoshiro


In [71]:
# Write the cleaned table to CSV in the working directory, leaving out the row index.
df_games.to_csv("games_cleaned.csv", index=False)