In [None]:
# This Python 3 environment comes with many helpful analytics libraries installed
# It is defined by the kaggle/python Docker image: https://github.com/kaggle/docker-python
# For example, here's several helpful packages to load

import numpy as np # linear algebra
import pandas as pd # data processing, CSV file I/O (e.g. pd.read_csv)

# Input data files are available in the read-only "../input/" directory
# For example, running this (by clicking run or pressing Shift+Enter) will list all files under the input directory

import os
# Walk the Kaggle input directory and print the full path of every file found.
for root, _subdirs, files in os.walk('/kaggle/input'):
    for name in files:
        full_path = os.path.join(root, name)
        print(full_path)

# You can write up to 20GB to the current directory (/kaggle/working/) that gets preserved as output when you create a version using "Save & Run All" 
# You can also write temporary files to /kaggle/temp/, but they won't be saved outside of the current session

In [None]:
import matplotlib.pyplot as plt

In [None]:
# Load the OECD time-use table from the Kaggle input directory and display it.
time_use_csv = "/kaggle/input/time-use-employment-and-gdp-per-country/Time_use_OECD.csv"
df = pd.read_csv(time_use_csv)
df

In [None]:
# Print a summary of the frame (columns, non-null counts, dtypes) as loaded.
df.info()

**We convert a str attribute (Minutes_per_day) to an integer**

In [None]:
# Cast the Minutes_per_day column to a 64-bit integer dtype and store it back.
minutes_as_int = df["Minutes_per_day"].astype(np.int64)
df["Minutes_per_day"] = minutes_as_int

**Now we check the conversion**

In [None]:
# Print the summary again so the dtype of Minutes_per_day can be inspected after the cast.
df.info()

**We add a variable to the dataset to reflect the number of hours spent in each record.**

In [None]:
# Derive an Hours column: minutes divided by 60, rounded to two decimals.
df["Hours"] = df["Minutes_per_day"].div(60).round(2)
df

**We analyze the number of hours dedicated according to Description.**

In [None]:
# Aggregate Hours per Description (pivot_table uses the mean by default),
# round to one decimal and order the rows by ascending Hours.
mean_hours = df.pivot_table(values=["Hours"], index=["Description"])
hours_per_description = mean_hours.round(1).sort_values(by="Hours")
hours_per_description

**We graph it.**

In [None]:
# Line chart of the aggregated hours for each Description.
plt.figure(figsize=(5,5))
plt.plot(hours_per_description.index, hours_per_description.values, linewidth=3)
# Title and axis labels let the figure be read without the surrounding cells,
# matching the labelled unpaid-work chart further down the notebook.
plt.title("Average hours per activity", size=12)
plt.ylabel("Hours spent", size=12)
plt.xlabel("Description", size=12)
# Category names are long, so the x tick labels are rotated to vertical.
plt.xticks(rotation=90)
plt.grid(visible=True, axis="both", which="major", color='c', linestyle='-.', linewidth=0.5)
plt.tick_params(labelcolor='c', labelsize='medium', width=2)
plt.show()

**We analyze the number of hours dedicated to each description by gender.**

In [None]:
# Aggregate Hours per Description with one column per Sex value
# (pivot_table uses the mean by default), rounded to two decimals.
hours_by_sex = df.pivot_table(values=["Hours"], index=["Description"], columns=["Sex"])
description_sex = hours_by_sex.round(2)
description_sex

**We graph the distribution.**

In [None]:
# Line chart of hours per Description, one line per Sex column of the pivot.
# The style is selected before the figure is created: plt.style.use only
# affects artists created afterwards, so calling it after plotting leaves the
# figure partly styled and makes its look depend on cell execution order.
plt.style.use('fivethirtyeight')
plt.figure(figsize=(5,5))
# The pivot columns are (value, Sex) pairs; the legend label is taken from the
# Sex part of each column instead of a hard-coded tuple, so every line is
# labelled with the category it actually shows, whatever the number or order
# of categories in the data.
for column in description_sex.columns:
    plt.plot(description_sex.index, description_sex[column], label=column[-1], linewidth=3)
plt.title("Average hours per activity by sex", size=12)
plt.ylabel("Hours spent", size=12)
plt.xlabel("Description", size=12)
# Category names are long, so the x tick labels are rotated to vertical.
plt.xticks(rotation=90)
plt.grid(visible=True, axis="both", which="major", color='c', linestyle=':', linewidth=0.5, alpha=0.5)
plt.legend()
plt.show()

**Let's see the number of hours dedicated to unpaid work, filtering the top ten countries.**

In [None]:
# Keep the 'Unpaid work' rows, order them by descending Hours and take the first ten.
# NOTE(review): if the data holds several rows per country (e.g. one per Sex),
# these are the top ten rows rather than ten distinct countries — confirm.
is_unpaid_work = df["Description"] == 'Unpaid work'
unpaid_work = df[is_unpaid_work].sort_values(by="Hours", ascending=False).head(10)
unpaid_work

**Let's graph it.**

In [None]:
# Line chart of Hours for the selected unpaid-work rows, by Country.
# The style is selected before the figure is created so the whole chart uses
# it; plt.style.use only affects artists created after the call.
plt.style.use('fivethirtyeight')
plt.figure(figsize=(5,5))
# The line is a regular static artist. `animated=True` is intentionally not
# passed: animated artists are excluded from the normal draw and are meant for
# manual blitting, so the line could be missing on interactive backends.
plt.plot(unpaid_work["Country"], unpaid_work["Hours"], alpha=0.5, c="g", linewidth=3)
plt.title("Unpaid work per top 10 country", size=12)
plt.ylabel("Hours spent", size=12)
plt.xlabel("Country", size=12)
# A single explicit grid call: a bare plt.grid() toggles visibility and would
# make the result depend on whether the active style already shows a grid.
plt.grid(visible=True, axis="both", which="major", linestyle=':', linewidth=0.5)
plt.tick_params(labelcolor='black', labelsize='small', width=2, grid_color='r')
plt.xticks(rotation=90)
plt.show()