In [1]:
import pandas as pd 
import numpy as np
import json
import ast
import gzip
from datetime import date
from textblob import TextBlob

In [5]:
rows = []

with open("australian_user_reviews.json", encoding='MacRoman') as f:
    for line in f.readlines():
        rows.append(ast.literal_eval(line))

df_reviews = pd.DataFrame(rows)

In [3]:
df_reviews["reviews"] = df_reviews["reviews"].astype("string")
df_reviews.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 25799 entries, 0 to 25798
Data columns (total 3 columns):
 #   Column    Non-Null Count  Dtype 
---  ------    --------------  ----- 
 0   user_id   25799 non-null  object
 1   user_url  25799 non-null  object
 2   reviews   25799 non-null  string
dtypes: object(2), string(1)
memory usage: 604.8+ KB


In [7]:
df_reviews["reviews"].iloc[0]

[{'funny': '',
  'posted': 'Posted November 5, 2011.',
  'last_edited': '',
  'item_id': '1250',
  'helpful': 'No ratings yet',
  'recommend': True,
  'review': 'Simple yet with great replayability. In my opinion does "zombie" hordes and team work better than left 4 dead plus has a global leveling system. Alot of down to earth "zombie" splattering fun for the whole family. Amazed this sort of FPS is so rare.'},
 {'funny': '',
  'posted': 'Posted July 15, 2011.',
  'last_edited': '',
  'item_id': '22200',
  'helpful': 'No ratings yet',
  'recommend': True,
  'review': "It's unique and worth a playthrough."},
 {'funny': '',
  'posted': 'Posted April 21, 2011.',
  'last_edited': '',
  'item_id': '43110',
  'helpful': 'No ratings yet',
  'recommend': True,
  'review': 'Great atmosphere. The gunplay can be a bit chunky at times but at the end of the day this game is definitely worth it and I hope they do a sequel...so buy the game so I get a sequel!'}]

In [8]:
def analyze_sentiment(review_list):
    sentiments = []
    for review_dict in review_list:
        review_text = review_dict.get('review', '')  # Extrae el texto de la revisión
        analysis = TextBlob(review_text)
        if analysis.sentiment.polarity > 0:
            sentiments.append(2)  # Sentimiento positivo
        elif analysis.sentiment.polarity < 0:
            sentiments.append(0)  # Sentimiento negativo
        else:
            sentiments.append(1)  # Sentimiento neutral
    return sentiments

# Aplica la función para analizar el sentimiento a la columna 'reviews' que contiene listas de diccionarios
df_reviews['polaridad'] = df_reviews['reviews'].apply(analyze_sentiment)


In [10]:
df_reviews

Unnamed: 0,user_id,user_url,reviews,polaridad
0,76561197970982479,http://steamcommunity.com/profiles/76561197970...,"[{'funny': '', 'posted': 'Posted November 5, 2...","[2, 2, 2]"
1,js41637,http://steamcommunity.com/id/js41637,"[{'funny': '', 'posted': 'Posted June 24, 2014...","[2, 0, 0]"
2,evcentric,http://steamcommunity.com/id/evcentric,"[{'funny': '', 'posted': 'Posted February 3.',...","[2, 2, 2, 0, 2, 2]"
3,doctr,http://steamcommunity.com/id/doctr,"[{'funny': '', 'posted': 'Posted October 14, 2...","[2, 2, 2, 2, 0, 2]"
4,maplemage,http://steamcommunity.com/id/maplemage,"[{'funny': '3 people found this review funny',...","[1, 2, 2, 2]"
...,...,...,...,...
25794,76561198306599751,http://steamcommunity.com/profiles/76561198306...,"[{'funny': '', 'posted': 'Posted May 31.', 'la...",[2]
25795,Ghoustik,http://steamcommunity.com/id/Ghoustik,"[{'funny': '', 'posted': 'Posted June 17.', 'l...",[1]
25796,76561198310819422,http://steamcommunity.com/profiles/76561198310...,"[{'funny': '1 person found this review funny',...",[1]
25797,76561198312638244,http://steamcommunity.com/profiles/76561198312...,"[{'funny': '', 'posted': 'Posted July 21.', 'l...","[2, 2, 2, 2]"


In [2]:
data_list= []
file_path = "australian_users_items.json"

with open(file_path,"r", encoding='utf-8') as archivo:
    for line in archivo:
        try:
            json_data = ast.literal_eval(line)
            data_list.append(json_data)
        except ValueError as e:
            print(f"Error en la linea:{line}")
            continue  

df_items = pd.DataFrame(data_list)
df_items.head()


Unnamed: 0,user_id,items_count,steam_id,user_url,items
0,76561197970982479,277,76561197970982479,http://steamcommunity.com/profiles/76561197970...,"[{'item_id': '10', 'item_name': 'Counter-Strik..."
1,js41637,888,76561198035864385,http://steamcommunity.com/id/js41637,"[{'item_id': '10', 'item_name': 'Counter-Strik..."
2,evcentric,137,76561198007712555,http://steamcommunity.com/id/evcentric,"[{'item_id': '1200', 'item_name': 'Red Orchest..."
3,Riot-Punch,328,76561197963445855,http://steamcommunity.com/id/Riot-Punch,"[{'item_id': '10', 'item_name': 'Counter-Strik..."
4,doctr,541,76561198002099482,http://steamcommunity.com/id/doctr,"[{'item_id': '300', 'item_name': 'Day of Defea..."


In [3]:
df_items["items"].iloc[0]

[{'item_id': '10',
  'item_name': 'Counter-Strike',
  'playtime_forever': 6,
  'playtime_2weeks': 0},
 {'item_id': '20',
  'item_name': 'Team Fortress Classic',
  'playtime_forever': 0,
  'playtime_2weeks': 0},
 {'item_id': '30',
  'item_name': 'Day of Defeat',
  'playtime_forever': 7,
  'playtime_2weeks': 0},
 {'item_id': '40',
  'item_name': 'Deathmatch Classic',
  'playtime_forever': 0,
  'playtime_2weeks': 0},
 {'item_id': '50',
  'item_name': 'Half-Life: Opposing Force',
  'playtime_forever': 0,
  'playtime_2weeks': 0},
 {'item_id': '60',
  'item_name': 'Ricochet',
  'playtime_forever': 0,
  'playtime_2weeks': 0},
 {'item_id': '70',
  'item_name': 'Half-Life',
  'playtime_forever': 0,
  'playtime_2weeks': 0},
 {'item_id': '130',
  'item_name': 'Half-Life: Blue Shift',
  'playtime_forever': 0,
  'playtime_2weeks': 0},
 {'item_id': '300',
  'item_name': 'Day of Defeat: Source',
  'playtime_forever': 4733,
  'playtime_2weeks': 0},
 {'item_id': '240',
  'item_name': 'Counter-Strike: S

In [12]:

compressed_file = (r'C:\Users\pao_i\Downloads\steam_games.json.gz')

with gzip.open(compressed_file, 'rb') as f:
    data = f.read()

json_str = data.decode('utf-8')
data_list = json_str.strip().split('\n')

dfs = []
for item in data_list:
    data_dict = json.loads(item)
    df = pd.DataFrame([data_dict])
    dfs.append(df)

final_df = pd.concat(dfs, ignore_index=True)

final_df  

Unnamed: 0,publisher,genres,app_name,title,url,release_date,tags,reviews_url,specs,price,early_access,id,developer
0,,,,,,,,,,,,,
1,,,,,,,,,,,,,
2,,,,,,,,,,,,,
3,,,,,,,,,,,,,
4,,,,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...
120440,Ghost_RUS Games,"[Casual, Indie, Simulation, Strategy]",Colony On Mars,Colony On Mars,http://store.steampowered.com/app/773640/Colon...,2018-01-04,"[Strategy, Indie, Casual, Simulation]",http://steamcommunity.com/app/773640/reviews/?...,"[Single-player, Steam Achievements]",1.99,0.0,773640,"Nikita ""Ghost_RUS"""
120441,Sacada,"[Casual, Indie, Strategy]",LOGistICAL: South Africa,LOGistICAL: South Africa,http://store.steampowered.com/app/733530/LOGis...,2018-01-04,"[Strategy, Indie, Casual]",http://steamcommunity.com/app/733530/reviews/?...,"[Single-player, Steam Achievements, Steam Clou...",4.99,0.0,733530,Sacada
120442,Laush Studio,"[Indie, Racing, Simulation]",Russian Roads,Russian Roads,http://store.steampowered.com/app/610660/Russi...,2018-01-04,"[Indie, Simulation, Racing]",http://steamcommunity.com/app/610660/reviews/?...,"[Single-player, Steam Achievements, Steam Trad...",1.99,0.0,610660,Laush Dmitriy Sergeevich
120443,SIXNAILS,"[Casual, Indie]",EXIT 2 - Directions,EXIT 2 - Directions,http://store.steampowered.com/app/658870/EXIT_...,2017-09-02,"[Indie, Casual, Puzzle, Singleplayer, Atmosphe...",http://steamcommunity.com/app/658870/reviews/?...,"[Single-player, Steam Achievements, Steam Cloud]",4.99,0.0,658870,"xropi,stev3ns"


In [22]:
df_games = final_df
df_games_2 = df_games
df_games.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 120445 entries, 0 to 120444
Data columns (total 13 columns):
 #   Column        Non-Null Count   Dtype 
---  ------        --------------   ----- 
 0   publisher     24083 non-null   object
 1   genres        120445 non-null  object
 2   app_name      32133 non-null   object
 3   title         30085 non-null   object
 4   url           32135 non-null   object
 5   release_date  30068 non-null   object
 6   tags          31972 non-null   object
 7   reviews_url   32133 non-null   object
 8   specs         31465 non-null   object
 9   price         30758 non-null   object
 10  early_access  32135 non-null   object
 11  id            32133 non-null   object
 12  developer     28836 non-null   object
dtypes: object(13)
memory usage: 11.9+ MB


primero realizo un etl a los 3 data frames

In [23]:
df_games.drop(["publisher","tags","title","early_access","specs","url"],axis=1,inplace=True)

In [24]:
df_games.dropna(inplace=True)

In [25]:
df_games['genres'] = df_games['genres'].apply(lambda x: x if isinstance(x, list) else [x])

In [26]:
df_games['genres'] = df_games['genres'].apply(lambda x: [str(genre) for genre in x])

In [27]:
df_games = df_games.explode('genres')

In [28]:
df_dummies = pd.get_dummies(df_games['genres'], prefix='', prefix_sep='')

In [29]:
df_dummies_combined = df_dummies.groupby(level=0).max()

In [30]:
df_dummies_combined

Unnamed: 0,Accounting,Action,Adventure,Animation &amp; Modeling,Audio Production,Casual,Design &amp; Illustration,Early Access,Education,Free to Play,...,RPG,Racing,Simulation,Software Training,Sports,Strategy,Utilities,Video Production,Web Publishing,nan
88310,False,True,False,False,False,True,False,False,False,False,...,False,False,True,False,False,True,False,False,False,False
88311,False,False,False,False,False,False,False,False,False,True,...,True,False,False,False,False,True,False,False,False,False
88312,False,False,False,False,False,True,False,False,False,True,...,False,False,True,False,True,False,False,False,False,False
88313,False,True,True,False,False,True,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
88315,False,True,True,False,False,False,False,False,False,False,...,False,False,True,False,False,False,False,False,False,False
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
120439,False,True,True,False,False,True,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
120440,False,False,False,False,False,True,False,False,False,False,...,False,False,True,False,False,True,False,False,False,False
120441,False,False,False,False,False,True,False,False,False,False,...,False,False,False,False,False,True,False,False,False,False
120442,False,False,False,False,False,False,False,False,False,False,...,False,True,True,False,False,False,False,False,False,False


In [31]:
df_games_2 = pd.concat([df_games_2,df_dummies_combined],axis=1)

In [32]:
df_games_2

Unnamed: 0,genres,app_name,release_date,reviews_url,price,id,developer,Accounting,Action,Adventure,...,RPG,Racing,Simulation,Software Training,Sports,Strategy,Utilities,Video Production,Web Publishing,nan
88310,"[Action, Casual, Indie, Simulation, Strategy]",Lost Summoner Kitty,2018-01-04,http://steamcommunity.com/app/761140/reviews/?...,4.99,761140,Kotoshiro,False,True,False,...,False,False,True,False,False,True,False,False,False,False
88311,"[Free to Play, Indie, RPG, Strategy]",Ironbound,2018-01-04,http://steamcommunity.com/app/643980/reviews/?...,Free To Play,643980,Secret Level SRL,False,False,False,...,True,False,False,False,False,True,False,False,False,False
88312,"[Casual, Free to Play, Indie, Simulation, Sports]",Real Pool 3D - Poolians,2017-07-24,http://steamcommunity.com/app/670290/reviews/?...,Free to Play,670290,Poolians.com,False,False,False,...,False,False,True,False,True,False,False,False,False,False
88313,"[Action, Adventure, Casual]",弹炸人2222,2017-12-07,http://steamcommunity.com/app/767400/reviews/?...,0.99,767400,彼岸领域,False,True,True,...,False,False,False,False,False,False,False,False,False,False
88315,"[Action, Adventure, Simulation]",Battle Royale Trainer,2018-01-04,http://steamcommunity.com/app/772540/reviews/?...,3.99,772540,Trickjump Games Ltd,False,True,True,...,False,False,True,False,False,False,False,False,False,False
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
120439,"[Action, Adventure, Casual, Indie]",Kebab it Up!,2018-01-04,http://steamcommunity.com/app/745400/reviews/?...,1.99,745400,Bidoniera Games,False,True,True,...,False,False,False,False,False,False,False,False,False,False
120440,"[Casual, Indie, Simulation, Strategy]",Colony On Mars,2018-01-04,http://steamcommunity.com/app/773640/reviews/?...,1.99,773640,"Nikita ""Ghost_RUS""",False,False,False,...,False,False,True,False,False,True,False,False,False,False
120441,"[Casual, Indie, Strategy]",LOGistICAL: South Africa,2018-01-04,http://steamcommunity.com/app/733530/reviews/?...,4.99,733530,Sacada,False,False,False,...,False,False,False,False,False,True,False,False,False,False
120442,"[Indie, Racing, Simulation]",Russian Roads,2018-01-04,http://steamcommunity.com/app/610660/reviews/?...,1.99,610660,Laush Dmitriy Sergeevich,False,False,False,...,False,True,True,False,False,False,False,False,False,False


In [33]:
df_games_2.drop(columns=("genres"),axis=1,inplace=True)

In [34]:
df_games_2

Unnamed: 0,app_name,release_date,reviews_url,price,id,developer,Accounting,Action,Adventure,Animation &amp; Modeling,...,RPG,Racing,Simulation,Software Training,Sports,Strategy,Utilities,Video Production,Web Publishing,nan
88310,Lost Summoner Kitty,2018-01-04,http://steamcommunity.com/app/761140/reviews/?...,4.99,761140,Kotoshiro,False,True,False,False,...,False,False,True,False,False,True,False,False,False,False
88311,Ironbound,2018-01-04,http://steamcommunity.com/app/643980/reviews/?...,Free To Play,643980,Secret Level SRL,False,False,False,False,...,True,False,False,False,False,True,False,False,False,False
88312,Real Pool 3D - Poolians,2017-07-24,http://steamcommunity.com/app/670290/reviews/?...,Free to Play,670290,Poolians.com,False,False,False,False,...,False,False,True,False,True,False,False,False,False,False
88313,弹炸人2222,2017-12-07,http://steamcommunity.com/app/767400/reviews/?...,0.99,767400,彼岸领域,False,True,True,False,...,False,False,False,False,False,False,False,False,False,False
88315,Battle Royale Trainer,2018-01-04,http://steamcommunity.com/app/772540/reviews/?...,3.99,772540,Trickjump Games Ltd,False,True,True,False,...,False,False,True,False,False,False,False,False,False,False
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
120439,Kebab it Up!,2018-01-04,http://steamcommunity.com/app/745400/reviews/?...,1.99,745400,Bidoniera Games,False,True,True,False,...,False,False,False,False,False,False,False,False,False,False
120440,Colony On Mars,2018-01-04,http://steamcommunity.com/app/773640/reviews/?...,1.99,773640,"Nikita ""Ghost_RUS""",False,False,False,False,...,False,False,True,False,False,True,False,False,False,False
120441,LOGistICAL: South Africa,2018-01-04,http://steamcommunity.com/app/733530/reviews/?...,4.99,733530,Sacada,False,False,False,False,...,False,False,False,False,False,True,False,False,False,False
120442,Russian Roads,2018-01-04,http://steamcommunity.com/app/610660/reviews/?...,1.99,610660,Laush Dmitriy Sergeevich,False,False,False,False,...,False,True,True,False,False,False,False,False,False,False


In [35]:
df_games_2.info()

<class 'pandas.core.frame.DataFrame'>
Index: 27596 entries, 88310 to 120443
Data columns (total 29 columns):
 #   Column                     Non-Null Count  Dtype 
---  ------                     --------------  ----- 
 0   app_name                   27596 non-null  object
 1   release_date               27596 non-null  object
 2   reviews_url                27596 non-null  object
 3   price                      27596 non-null  object
 4   id                         27596 non-null  object
 5   developer                  27596 non-null  object
 6   Accounting                 27596 non-null  bool  
 7   Action                     27596 non-null  bool  
 8   Adventure                  27596 non-null  bool  
 9   Animation &amp; Modeling   27596 non-null  bool  
 10  Audio Production           27596 non-null  bool  
 11  Casual                     27596 non-null  bool  
 12  Design &amp; Illustration  27596 non-null  bool  
 13  Early Access               27596 non-null  bool  
 14  Educat

In [36]:
df_games_2["price"].unique()

array([4.99, 'Free To Play', 'Free to Play', 0.99, 3.99, 9.99, 18.99,
       29.99, 10.99, 2.99, 1.59, 14.99, 1.99, 59.99, 8.99, 6.99, 7.99,
       39.99, 'Free', 19.99, 7.49, 12.99, 5.99, 2.49, 15.99, 1.25, 24.99,
       17.99, 61.99, 3.49, 11.99, 13.99, 'Free Demo', 'Play for Free!',
       34.99, 1.49, 32.99, 99.99, 14.95, 69.99, 16.99, 79.99, 49.99, 5.0,
       13.98, 29.96, 119.99, 109.99, 149.99, 771.71, 'Install Now', 21.99,
       89.99, 'Play WARMACHINE: Tactics Demo', 0.98, 139.92, 4.29,
       'Free Mod', 54.99, 64.99, 74.99, 'Install Theme', 0.89,
       'Third-party', 0.5, 'Play Now', 299.99, 1.29, 44.99, 3.0, 15.0,
       5.49, 23.99, 49.0, 10.93, 1.39, 'Free HITMAN™ Holiday Pack', 36.99,
       4.49, 2.0, 4.0, 234.99, 1.95, 1.5, 199.0, 189.0, 6.66, 27.99,
       129.99, 179.0, 26.99, 399.99, 31.99, 399.0, 20.0, 40.0, 3.33,
       22.99, 320.0, 38.85, 71.7, 995.0, 27.49, 3.39, 6.0, 19.95, 20.99,
       499.99, 199.99, 16.06, 4.68, 131.4, 44.98, 202.76, 2.3, 0.95,
       1

In [37]:
df_games_2["price"].replace(["Free To Play","Free to Play",0.00,'Free to Use','Play the Demo','Free Mod','Free HITMAN™ Holiday Pack','Play WARMACHINE: Tactics Demo','Play for Free!','Free Demo','Free to Try','Play Now','Install Now','Install Theme','Third-party'],"Free",inplace=True)



In [38]:
df_games_2["price"].unique()

array([4.99, 'Free', 0.99, 3.99, 9.99, 18.99, 29.99, 10.99, 2.99, 1.59,
       14.99, 1.99, 59.99, 8.99, 6.99, 7.99, 39.99, 19.99, 7.49, 12.99,
       5.99, 2.49, 15.99, 1.25, 24.99, 17.99, 61.99, 3.49, 11.99, 13.99,
       34.99, 1.49, 32.99, 99.99, 14.95, 69.99, 16.99, 79.99, 49.99, 5.0,
       13.98, 29.96, 119.99, 109.99, 149.99, 771.71, 21.99, 89.99, 0.98,
       139.92, 4.29, 54.99, 64.99, 74.99, 0.89, 0.5, 299.99, 1.29, 44.99,
       3.0, 15.0, 5.49, 23.99, 49.0, 10.93, 1.39, 36.99, 4.49, 2.0, 4.0,
       234.99, 1.95, 1.5, 199.0, 189.0, 6.66, 27.99, 129.99, 179.0, 26.99,
       399.99, 31.99, 399.0, 20.0, 40.0, 3.33, 22.99, 320.0, 38.85, 71.7,
       995.0, 27.49, 3.39, 6.0, 19.95, 20.99, 499.99, 199.99, 16.06, 4.68,
       131.4, 44.98, 202.76, 2.3, 0.95, 172.24, 249.99, 2.97, 10.96, 10.0,
       30.0, 2.66, 6.48, 1.0, 11.15, 99.0, 87.94, 0.49, 9.98, 9.95, 7.0,
       12.89, 6.49, 1.87, 42.99, 41.99, 289.99, 23.96, 5.65, 12.0, 59.95,
       13.37, 189.96, 124.99, 19.98, 160.91

In [39]:
df_games_2

Unnamed: 0,app_name,release_date,reviews_url,price,id,developer,Accounting,Action,Adventure,Animation &amp; Modeling,...,RPG,Racing,Simulation,Software Training,Sports,Strategy,Utilities,Video Production,Web Publishing,nan
88310,Lost Summoner Kitty,2018-01-04,http://steamcommunity.com/app/761140/reviews/?...,4.99,761140,Kotoshiro,False,True,False,False,...,False,False,True,False,False,True,False,False,False,False
88311,Ironbound,2018-01-04,http://steamcommunity.com/app/643980/reviews/?...,Free,643980,Secret Level SRL,False,False,False,False,...,True,False,False,False,False,True,False,False,False,False
88312,Real Pool 3D - Poolians,2017-07-24,http://steamcommunity.com/app/670290/reviews/?...,Free,670290,Poolians.com,False,False,False,False,...,False,False,True,False,True,False,False,False,False,False
88313,弹炸人2222,2017-12-07,http://steamcommunity.com/app/767400/reviews/?...,0.99,767400,彼岸领域,False,True,True,False,...,False,False,False,False,False,False,False,False,False,False
88315,Battle Royale Trainer,2018-01-04,http://steamcommunity.com/app/772540/reviews/?...,3.99,772540,Trickjump Games Ltd,False,True,True,False,...,False,False,True,False,False,False,False,False,False,False
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
120439,Kebab it Up!,2018-01-04,http://steamcommunity.com/app/745400/reviews/?...,1.99,745400,Bidoniera Games,False,True,True,False,...,False,False,False,False,False,False,False,False,False,False
120440,Colony On Mars,2018-01-04,http://steamcommunity.com/app/773640/reviews/?...,1.99,773640,"Nikita ""Ghost_RUS""",False,False,False,False,...,False,False,True,False,False,True,False,False,False,False
120441,LOGistICAL: South Africa,2018-01-04,http://steamcommunity.com/app/733530/reviews/?...,4.99,733530,Sacada,False,False,False,False,...,False,False,False,False,False,True,False,False,False,False
120442,Russian Roads,2018-01-04,http://steamcommunity.com/app/610660/reviews/?...,1.99,610660,Laush Dmitriy Sergeevich,False,False,False,False,...,False,True,True,False,False,False,False,False,False,False


In [40]:
df_games_2["release_date"] = df_games_2["release_date"].astype(dtype='string')

In [41]:
df_games_2["Year"] = df_games_2.release_date.str.findall(r"\d{4}").str.get(0)

In [None]:
df_games_2.dropna(inplace=True)

In [43]:
df_games_2

Unnamed: 0,app_name,release_date,reviews_url,price,id,developer,Accounting,Action,Adventure,Animation &amp; Modeling,...,Racing,Simulation,Software Training,Sports,Strategy,Utilities,Video Production,Web Publishing,nan,Year
88310,Lost Summoner Kitty,2018-01-04,http://steamcommunity.com/app/761140/reviews/?...,4.99,761140,Kotoshiro,False,True,False,False,...,False,True,False,False,True,False,False,False,False,2018
88311,Ironbound,2018-01-04,http://steamcommunity.com/app/643980/reviews/?...,Free,643980,Secret Level SRL,False,False,False,False,...,False,False,False,False,True,False,False,False,False,2018
88312,Real Pool 3D - Poolians,2017-07-24,http://steamcommunity.com/app/670290/reviews/?...,Free,670290,Poolians.com,False,False,False,False,...,False,True,False,True,False,False,False,False,False,2017
88313,弹炸人2222,2017-12-07,http://steamcommunity.com/app/767400/reviews/?...,0.99,767400,彼岸领域,False,True,True,False,...,False,False,False,False,False,False,False,False,False,2017
88315,Battle Royale Trainer,2018-01-04,http://steamcommunity.com/app/772540/reviews/?...,3.99,772540,Trickjump Games Ltd,False,True,True,False,...,False,True,False,False,False,False,False,False,False,2018
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
120439,Kebab it Up!,2018-01-04,http://steamcommunity.com/app/745400/reviews/?...,1.99,745400,Bidoniera Games,False,True,True,False,...,False,False,False,False,False,False,False,False,False,2018
120440,Colony On Mars,2018-01-04,http://steamcommunity.com/app/773640/reviews/?...,1.99,773640,"Nikita ""Ghost_RUS""",False,False,False,False,...,False,True,False,False,True,False,False,False,False,2018
120441,LOGistICAL: South Africa,2018-01-04,http://steamcommunity.com/app/733530/reviews/?...,4.99,733530,Sacada,False,False,False,False,...,False,False,False,False,True,False,False,False,False,2018
120442,Russian Roads,2018-01-04,http://steamcommunity.com/app/610660/reviews/?...,1.99,610660,Laush Dmitriy Sergeevich,False,False,False,False,...,True,True,False,False,False,False,False,False,False,2018


In [44]:
df_games_2.drop(["release_date"],axis=1,inplace=True)

In [45]:
df_games_2

Unnamed: 0,app_name,reviews_url,price,id,developer,Accounting,Action,Adventure,Animation &amp; Modeling,Audio Production,...,Racing,Simulation,Software Training,Sports,Strategy,Utilities,Video Production,Web Publishing,nan,Year
88310,Lost Summoner Kitty,http://steamcommunity.com/app/761140/reviews/?...,4.99,761140,Kotoshiro,False,True,False,False,False,...,False,True,False,False,True,False,False,False,False,2018
88311,Ironbound,http://steamcommunity.com/app/643980/reviews/?...,Free,643980,Secret Level SRL,False,False,False,False,False,...,False,False,False,False,True,False,False,False,False,2018
88312,Real Pool 3D - Poolians,http://steamcommunity.com/app/670290/reviews/?...,Free,670290,Poolians.com,False,False,False,False,False,...,False,True,False,True,False,False,False,False,False,2017
88313,弹炸人2222,http://steamcommunity.com/app/767400/reviews/?...,0.99,767400,彼岸领域,False,True,True,False,False,...,False,False,False,False,False,False,False,False,False,2017
88315,Battle Royale Trainer,http://steamcommunity.com/app/772540/reviews/?...,3.99,772540,Trickjump Games Ltd,False,True,True,False,False,...,False,True,False,False,False,False,False,False,False,2018
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
120439,Kebab it Up!,http://steamcommunity.com/app/745400/reviews/?...,1.99,745400,Bidoniera Games,False,True,True,False,False,...,False,False,False,False,False,False,False,False,False,2018
120440,Colony On Mars,http://steamcommunity.com/app/773640/reviews/?...,1.99,773640,"Nikita ""Ghost_RUS""",False,False,False,False,False,...,False,True,False,False,True,False,False,False,False,2018
120441,LOGistICAL: South Africa,http://steamcommunity.com/app/733530/reviews/?...,4.99,733530,Sacada,False,False,False,False,False,...,False,False,False,False,True,False,False,False,False,2018
120442,Russian Roads,http://steamcommunity.com/app/610660/reviews/?...,1.99,610660,Laush Dmitriy Sergeevich,False,False,False,False,False,...,True,True,False,False,False,False,False,False,False,2018


In [46]:
free = (df_games_2["price"] == "Free")

In [47]:
df_dev = df_games_2[["Year","developer","price"]][free]

In [48]:
df_dev

Unnamed: 0,Year,developer,price
88311,2018,Secret Level SRL,Free
88312,2017,Poolians.com,Free
88370,2006,Unknown Worlds Entertainment,Free
88501,2008,Sandstorm Productions,Free
88558,2009,Darklight Games,Free
...,...,...,...
120287,2017,Screenhit Studios,Free
120303,2017,ebi-hime,Free
120317,2018,Engin Mercan,Free
120410,2018,杭州分浪网络科技有限公司,Free


In [None]:
def developer(developer):
    x = developer
            
