# Video game sales analysis
![game](https://png.pngtree.com/thumb_back/fw800/back_our/20190621/ourmid/pngtree-game-castle-dark-banner-image_178457.jpg)

In [None]:
import numpy as np # linear algebra
import pandas as pd # data processing, CSV file I/O (e.g. pd.read_csv)

Fields include:

1. Rank - Ranking of overall sales
2. Name - The game's name
3. Platform - Platform of the game's release (e.g. PC, PS4, etc.)
4. Year - Year of the game's release
5. Genre - Genre of the game
6. Publisher - Publisher of the game
7. NA_Sales - Sales in North America (in millions)
8. EU_Sales - Sales in Europe (in millions)
9. JP_Sales - Sales in Japan (in millions)
10. Other_Sales - Sales in the rest of the world (in millions)
11. Global_Sales - Total worldwide sales.

In [None]:
# Load the video game sales CSV and preview its first five rows.
df_games = pd.read_csv(filepath_or_buffer="../input/videogamesales/vgsales.csv")
df_games.head(n=5)

In [None]:
import matplotlib.pyplot as plt
%matplotlib inline
import seaborn as sns
import matplotlib

In [None]:
def plot_count(df, col):
    """Draw a bar chart and a pie chart of the row counts per value of ``col``.

    Rows are grouped by ``col`` and the non-null ``Rank`` entries in each
    group are counted. The bar chart is drawn on a 22x6 figure; the pie chart
    is drawn by pandas with a 14x14 figure size and its legend is anchored to
    the right of the axes.

    Args:
        df: DataFrame that contains ``col`` and a ``Rank`` column.
        col: Name of the column to group by; also used as the legend title.
    """
    counts = df.groupby(col)["Rank"].count().rename("count").to_frame()

    # Bar chart: one bar per distinct value of `col`.
    plt.figure(figsize=(22, 6))
    sns.barplot(x=counts.index, y=counts["count"])

    # Pie chart of the same counts, with the legend placed beside the pie.
    pie_axes = counts.plot.pie(y="count", figsize=(14, 14))
    pie_axes.legend(title=col, loc="center left", bbox_to_anchor=(1, 0, 0.5, 1))

    plt.show()

# Platform

In [None]:
# Number of games released on each platform.
plot_count(df=df_games, col="Platform")

# Year (only years with more than 60 games)

In [None]:
# Count the games per release year, keep only years with more than 60 entries,
# cast both columns to integers and index the result by year.
df_year = (
    df_games.groupby("Year")["Rank"]
    .count()
    .rename("count")
    .reset_index()
    .loc[lambda frame: frame["count"] > 60]
    .astype("int64")
    .set_index("Year")
)

# Bar chart of the yearly counts.
plt.figure(figsize=(22, 6))
sns.barplot(x=df_year.index, y=df_year["count"])

# Pie chart of the same counts, with the legend placed beside the pie.
df_year.plot.pie(y="count", figsize=(14, 14)).legend(
    title="Year",
    loc="center left",
    bbox_to_anchor=(1, 0, 0.5, 1),
)
plt.show()

# Genre

In [None]:
# Number of games in each genre.
plot_count(df=df_games, col="Genre")

# Publisher (only publishers with more than 300 games)

In [None]:
# Count the games per publisher and keep only publishers with more than 300.
df_Publisher = (
    df_games.groupby("Publisher")["Rank"]
    .count()
    .rename("count")
    .to_frame()
    .loc[lambda frame: frame["count"] > 300]
)

# Publisher names that passed the filter.
# NOTE(review): not referenced again in the visible cells — confirm whether it is still needed.
ingredients = df_Publisher.index.tolist()

# Bar chart; the publisher names are long, so the tick labels are rotated.
plt.figure(figsize=(22, 6))
a = sns.barplot(x=df_Publisher.index, y=df_Publisher["count"])
a.set_xticklabels(labels=df_Publisher.index, rotation=-65)

# Pie chart of the same counts, with the legend placed beside the pie.
df_Publisher.plot.pie(y="count", figsize=(14, 14)).legend(
    title="Publisher",
    loc="center left",
    bbox_to_anchor=(1, 0, 0.5, 1),
)
plt.show()

# Top 3 video games by sales region

1. NA_Sales - Sales in North America (in millions)
2. EU_Sales - Sales in Europe (in millions)
3. JP_Sales - Sales in Japan (in millions)
4. Other_Sales - Sales in the rest of the world (in millions)
5. Global_Sales - Total worldwide sales.

## Sales in North America (in millions)

In [None]:
# Three best-selling games in North America. nlargest picks the top rows
# without sorting the whole frame and keeps the first occurrence on ties.
df_games.nlargest(3, "NA_Sales")

## Sales in Europe (in millions)

In [None]:
# Three best-selling games in Europe. nlargest picks the top rows without
# sorting the whole frame and keeps the first occurrence on ties.
df_games.nlargest(3, "EU_Sales")

## Sales in Japan (in millions)

In [None]:
# Three best-selling games in Japan. nlargest picks the top rows without
# sorting the whole frame and keeps the first occurrence on ties.
df_games.nlargest(3, "JP_Sales")

## Sales in the rest of the world (in millions)

In [None]:
# Three best-selling games in the rest of the world. nlargest picks the top
# rows without sorting the whole frame and keeps the first occurrence on ties.
df_games.nlargest(3, "Other_Sales")

## Total worldwide sales

In [None]:
# Three best-selling games worldwide. nlargest picks the top rows without
# sorting the whole frame and keeps the first occurrence on ties.
df_games.nlargest(3, "Global_Sales")