<a href="https://colab.research.google.com/github/Utpal-Mishra/Omdena-Egypt-Local-Chapter-2021-Notebooks/blob/main/OmdenaEgypt2021AnalysisPart2.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

### **MOUNT GOOGLE DRIVE**

In [None]:
# Attach Google Drive to the Colab filesystem at /content/drive.
from google.colab import drive

drive.mount("/content/drive")
print("Drive Mounted!!!")

Mounted at /content/drive
Drive Mounted!!!


### **IMPORT LIBRARIES**

In [None]:
import pandas as pd
import plotly.express as px
import plotly.graph_objects as go

print("Libraries Imported!!!")

Libraries Imported!!!


### **IMPORT DATA**

In [None]:
import datetime

path = "/content/drive/MyDrive/Omdena/Egypt 2021/freshwater_withdrawals.csv"

# Read the CSV, drop the "Unnamed: 0" column and give the remaining
# columns display-friendly names.
data = (
    pd.read_csv(path)
    .drop(columns=["Unnamed: 0"])
    .rename(
        columns={
            "country_name": "Country Name",
            "country_iso3": "Country Code",
            "year": "Year",
            "indicator_name": "Indicator Name",
            "indicator_code": "Indicator Code",
            "value": "Value",
            "units": "Units",
        }
    )
)
print("Data Shape: ", data.shape)

# Order rows by unit, then indicator, then year; renumber them from zero and
# keep only the four columns the rest of the notebook reads.
data = (
    data.sort_values(["Units", "Indicator Name", "Year"])
    .reset_index(drop=True)
    .loc[:, ["Year", "Indicator Name", "Value", "Units"]]
)
data.head()

Data Shape:  (197, 7)


Unnamed: 0,Year,Indicator Name,Value,Units
0,1977,Water productivity,0.780681,total (constant 2010 US$ GDP per cubic meter ...
1,1982,Water productivity,1.107434,total (constant 2010 US$ GDP per cubic meter ...
2,1987,Water productivity,1.416261,total (constant 2010 US$ GDP per cubic meter ...
3,1992,Water productivity,1.68894,total (constant 2010 US$ GDP per cubic meter ...
4,1997,Water productivity,1.844611,total (constant 2010 US$ GDP per cubic meter ...


## **EXPLORATORY DATA ANALYSIS**

### **Checking Missing Values**

In [None]:
# Number of missing entries in each column.
data.isnull().sum()

Year              0
Indicator Name    0
Value             0
Units             0
dtype: int64

### **Frequency of Indicator Names in Egypt**

In [None]:
# How many rows each indicator contributes, most frequent first.
data.loc[:, "Indicator Name"].value_counts()

Annual freshwater withdrawals                                                          56
People using at least basic drinking water services                                    36
People with basic handwashing facilities including soap and water                      36
People using at least basic drinking water services (% of population)                  18
People with basic handwashing facilities including soap and water (% of population)    18
Renewable internal freshwater resources                                                12
Renewable internal freshwater resources per capita (cubic meters)                      12
Water productivity                                                                      9
Name: Indicator Name, dtype: int64

## **PLOTS**

### **Plotting Functions**

In [None]:
import plotly.express as px

def plot(df, title, name, color, dash):
  """Display an interactive Plotly chart of ``df["Value"]`` against ``df.index``.

  A bubble scatter is drawn first (marker size and colour both mapped to
  ``Value``) and a line trace through the same points is overlaid on it.
  The figure is shown immediately; nothing is returned.

  Args:
    df: DataFrame with a "Value" column. Its index supplies the x values;
      the cells in this notebook index it by "Year" before calling.
    title: Text used as the figure title.
    name: Legend label for the overlaid line trace.
    color: Colour of the overlaid line.
    dash: Plotly dash style of the overlaid line, e.g. "dash" or "dot".
  """
  # px.scatter creates the figure itself, so no empty go.Figure() is needed.
  fig = px.scatter(df, x=df.index, y="Value", size="Value", color="Value")
  fig.add_trace(go.Scatter(x=df.index, y=df.Value, name=name, line=dict(color=color, width=2, dash=dash)))
  # showline=True is what makes linewidth/linecolor/mirror take effect; it is
  # set on both axes so the plot gets a complete black frame.
  fig.update_xaxes(title_text="Year", rangeslider_visible=True, showline=True, linewidth=2, linecolor='black', mirror=True)
  fig.update_yaxes(title_text="Value", showline=True, linewidth=2, linecolor='black', mirror=True)
  fig.update_layout(height=500, width=1000, title_text=title, xaxis_tickangle=-90)
  fig.show()

### **Water productivity** 

In [None]:
# Year-indexed values of the "Water productivity" indicator.
df = data.loc[
    data["Indicator Name"] == "Water productivity",
    ["Year", "Value"],
].set_index("Year")

plot(
    df,
    title="Water productivity in Egypt",
    name="total (constant 2010 US$ GDP per cubic meter of total freshwater withdrawal)",
    color="red",
    dash="dash",
)

### **People using at least basic drinking water services (% of population)** 

In [None]:
# Year-indexed values of the population-wide drinking water indicator.
df = data.loc[
    data["Indicator Name"] == "People using at least basic drinking water services (% of population)",
    ["Year", "Value"],
].set_index("Year")

plot(
    df,
    title="People using at least basic drinking water services (% of population) in Egypt",
    name="% of population",
    color="red",
    dash="dash",
)

### **People with basic handwashing facilities including soap and water (% of population)** 

In [None]:
# Year-indexed values of the population-wide handwashing indicator.
df = data.loc[
    data["Indicator Name"] == "People with basic handwashing facilities including soap and water (% of population)",
    ["Year", "Value"],
].set_index("Year")

plot(
    df,
    title="People with basic handwashing facilities including soap and water (% of population)",
    name="% of population",
    color="red",
    dash="dot",
)

### **Renewable internal freshwater resources** 

In [None]:
# Renewable internal freshwater resources, restricted to the
# "total (billion cubic meters)" unit and indexed by year.
df = data.loc[
    (data["Units"] == "total (billion cubic meters)")
    & (data["Indicator Name"] == "Renewable internal freshwater resources"),
    ["Year", "Value"],
].set_index("Year")

plot(
    df,
    title="Renewable internal freshwater resources in Egypt",
    name="total (billion cubic meters)",
    color="red",
    dash="dot",
)

### **Renewable internal freshwater resources per capita (cubic meters)** 

In [None]:
# Year-indexed values of the per-capita renewable freshwater indicator.
df = data.loc[
    data["Indicator Name"] == "Renewable internal freshwater resources per capita (cubic meters)",
    ["Year", "Value"],
].set_index("Year")

plot(
    df,
    title="Renewable internal freshwater resources per capita (cubic meters) in Egypt",
    name="cubic meters",
    color="red",
    dash="dot",
)

### **Annual freshwater withdrawals (agriculture)** 

In [None]:
# Annual freshwater withdrawals, restricted to the agriculture share and
# indexed by year.
df = data.loc[
    (data["Indicator Name"] == "Annual freshwater withdrawals")
    & (data["Units"] == "agriculture (% of total freshwater withdrawal)"),
    ["Year", "Value"],
].set_index("Year")

# The legend label must match the unit selected above (agriculture); it
# previously said "industry".
plot(
    df,
    title="Annual freshwater withdrawals in Egypt",
    name="agriculture (% of total freshwater withdrawal)",
    color="red",
    dash="dot",
)

### **Annual freshwater withdrawals (domestic)** 

In [None]:
# Annual freshwater withdrawals, restricted to the domestic share and
# indexed by year. The indicator is filtered explicitly (instead of applying
# the unit filter twice) so that rows of any other indicator sharing this
# unit string cannot leak into the plot.
df = data.loc[
    (data["Indicator Name"] == "Annual freshwater withdrawals")
    & (data["Units"] == "domestic (% of total freshwater withdrawal)"),
    ["Year", "Value"],
].set_index("Year")

plot(
    df,
    title="Annual freshwater withdrawals in Egypt",
    name="Domestic (% of total freshwater withdrawal)",
    color="red",
    dash="dot",
)

### **Annual freshwater withdrawals in total (billion cubic meters)** 

In [None]:
# Annual freshwater withdrawals, restricted to the
# "total (billion cubic meters)" unit and indexed by year.
df = data.loc[
    (data["Units"] == "total (billion cubic meters)")
    & (data["Indicator Name"] == "Annual freshwater withdrawals"),
    ["Year", "Value"],
].set_index("Year")

plot(
    df,
    title="Annual freshwater withdrawals in Egypt",
    name="total (billion cubic meters)",
    color="red",
    dash="dot",
)

### **People using at least basic drinking water services (rural)** 

In [None]:
# Drinking water services indicator, rural rows only, indexed by year.
df = data.loc[
    (data["Indicator Name"] == "People using at least basic drinking water services")
    & (data["Units"] == "rural (% of rural population)"),
    ["Year", "Value"],
].set_index("Year")

plot(
    df,
    title="People using at least basic drinking water services",
    name="% of rural population",
    color="red",
    dash="dot",
)

### **People using at least basic drinking water services (urban)** 

In [None]:
# Drinking water services indicator, urban rows only, indexed by year.
df = data.loc[
    (data["Indicator Name"] == "People using at least basic drinking water services")
    & (data["Units"] == "urban (% of urban population)"),
    ["Year", "Value"],
].set_index("Year")

plot(
    df,
    title="People using at least basic drinking water services",
    name="% of urban population",
    color="red",
    dash="dot",
)

### **People with basic handwashing facilities including soap and water (rural)** 

In [None]:
# Handwashing facilities indicator, rural rows only, indexed by year.
df = data.loc[
    (data["Indicator Name"] == "People with basic handwashing facilities including soap and water")
    & (data["Units"] == "rural (% of rural population)"),
    ["Year", "Value"],
].set_index("Year")

plot(
    df,
    title="People with basic handwashing facilities including soap and water in Egypt",
    name="% of rural population",
    color="red",
    dash="dot",
)

### **People with basic handwashing facilities including soap and water (urban)** 

In [None]:
# Handwashing facilities indicator, urban rows only, indexed by year.
df = data.loc[
    (data["Indicator Name"] == "People with basic handwashing facilities including soap and water")
    & (data["Units"] == "urban (% of urban population)"),
    ["Year", "Value"],
].set_index("Year")

plot(
    df,
    title="People with basic handwashing facilities including soap and water in Egypt",
    name="% of urban population",
    color="red",
    dash="dot",
)