In [None]:
import os
# Print the full path of every file found under the Kaggle input directory.
for root, _subdirs, files in os.walk('/kaggle/input'):
    for name in files:
        print(os.path.join(root, name))

In [None]:
import pandas as pd
import numpy as np

In [None]:
# Load the Kiva loans CSV from the Kaggle input directory into a DataFrame.
kiva = pd.read_csv('/kaggle/input/data-science-for-good-kiva-crowdfunding/kiva_loans.csv')

### First I displayed the first rows of the Kiva loans report, so that I would have a clear picture of what I am going to work with.

In [None]:
# Preview the first two rows of the loans table.
kiva.head(2)

### Here I pulled out the countries in the Kiva loans report and arranged them in descending order of the total loan amount they received.
### This shows that the Philippines, Kenya, the United States, Peru and Paraguay have the largest loan amounts.

In [None]:
# Total loan amount per country, ordered from largest to smallest.
loans = (
    kiva.groupby('country')['loan_amount']
    .sum()
    .sort_values(ascending=False)
    .reset_index()
)
loans

### Then I did the same descending-order arrangement for the loans taken up by the different sectors, and we see that
### Agriculture, Food, Retail, Services and Clothing take up the biggest loans.

In [None]:
# Ten sectors with the largest total loan amount, largest first.
sector = (
    kiva.groupby('sector')['loan_amount']
    .sum()
    .sort_values(ascending=False)
    .reset_index()
    .head(10)
)
sector

## So I come to my analysis of Mexico, the country I chose to analyse.
### I did the same thing first: displayed the first rows of the Mexico data to see what I am working with.

In [None]:
# Keep only the rows whose country is Mexico and renumber them from zero.
Mexico = kiva.loc[kiva['country'] == 'Mexico'].reset_index(drop=True)
Mexico.head(2)

### Here I get to see in-depth information about each column of the Mexico data

In [None]:
# Print the DataFrame.info() summary for the Mexico subset.
Mexico.info()

### I looked for the columns that have empty cells, and there were 5, though I didn't drop any cells or columns.

In [None]:
# Count the missing values in each column of the Mexico subset.
Mexico.isna().sum()

### Looked at the sectors in Mexico that had the highest loans

**Mexico, just like the world as a whole, has Agriculture, Retail and Food as its top three sectors, meaning it follows the worldwide pattern.**

In [None]:
# Ten Mexican sectors with the largest total loan amount, largest first.
Mexico_sector = (
    Mexico.groupby('sector')['loan_amount']
    .sum()
    .sort_values(ascending=False)
    .reset_index()
    .head(10)
)
Mexico_sector

#### Here I looked at the gender ratio of borrowers in the Kiva report: it is 76.53% to 23.0%, with females at 76.53% and males at 23.0%.

In [None]:
def gender_lead(gender):
    """Classify a borrower-genders value as 'female' or 'male'.

    The value is converted to text; it is labelled 'female' when that text
    starts with 'f' and 'male' in every other case.

    NOTE(review): anything that does not start with 'f' is labelled 'male'.
    That includes missing values, which become the text 'nan'. Confirm this
    is the intended treatment of missing data.
    """
    return 'female' if str(gender).startswith('f') else 'male'

In [None]:
# Label every loan 'female' or 'male' from its borrower_genders value, then
# check how many distinct labels were produced.
kiva['gender_lead'] = kiva['borrower_genders'].map(gender_lead)
kiva['gender_lead'].nunique()

In [None]:
# Count loans per gender label. The counts are looked up by label rather than
# by position, so the result does not depend on which label is more frequent.
gender_counts = kiva['gender_lead'].value_counts()
f = gender_counts.get('female', 0)
m = gender_counts.get('male', 0)

# Both shares are rounded to two decimals. Previously the second round() was
# closed too early, so the male share was rounded to a whole number and the
# trailing 2 was passed to format() as an unused argument.
print('{} females ({}%) vs {} males ({}%) got loans'.format(
    f, round(f * 100 / (f + m), 2), m, round(m * 100 / (f + m), 2)))

#### When you compare the gender ratio of the overall Kiva report with Mexico's, we notice that both have females as the majority of loan takers; only, in the case of Mexico, the difference between females and males is not that big.

In [None]:
# Label every Mexican loan 'female' or 'male' from its borrower_genders value,
# then check how many distinct labels were produced.
Mexico['gender_lead'] = Mexico['borrower_genders'].map(gender_lead)
Mexico['gender_lead'].nunique()

In [None]:
# Count Mexican loans per gender label. The counts are looked up by label
# rather than by position, so the result does not depend on which label is
# more frequent.
mexico_gender_counts = Mexico['gender_lead'].value_counts()
f = mexico_gender_counts.get('female', 0)
m = mexico_gender_counts.get('male', 0)

# Both shares are rounded to two decimals. Previously the second round() was
# closed too early, so the male share was rounded to a whole number and the
# trailing 2 was passed to format() as an unused argument.
print('{} females ({}%) vs {} males ({}%) got loans'.format(
    f, round(f * 100 / (f + m), 2), m, round(m * 100 / (f + m), 2)))

#### Mexico has more females than males, and the percentages are 57.1% to 43.0%.

In [None]:
# Ten Mexican activities with the largest total loan amount, largest first.
Mexico_activity = (
    Mexico.groupby('activity')['loan_amount']
    .sum()
    .sort_values(ascending=False)
    .reset_index()
    .head(10)
)
Mexico_activity

#### When we look at activity vs loan amount for the Mexico records, we notice that Personal Medical Expenses, Animal Sales and General Store have the highest loan amounts.

In [None]:
# Ten Mexican regions with the largest total loan amount, largest first.
Mexico_region = (
    Mexico.groupby('region')['loan_amount']
    .sum()
    .sort_values(ascending=False)
    .reset_index()
    .head(10)
)
Mexico_region

#### Then, when we compare region and loan amounts, Tierra Blanca, Monterrey and San Miguel get funded the most in Mexico.

In [None]:
# Total loan amount per repayment interval for Mexico, largest first
# (at most ten rows are kept).
Mexico_laonPaymentMethod = (
    Mexico.groupby('repayment_interval')['loan_amount']
    .sum()
    .sort_values(ascending=False)
    .reset_index()
    .head(10)
)
Mexico_laonPaymentMethod

#### Loan repayments in Mexico are mostly irregular, followed by monthly repayments.

### PLOTTING OF GRAPHS SHOWING THE TREND OF LOAN AMOUNTS IN MEXICO

In [None]:
import matplotlib.pyplot as plt
import warnings

# Suppress every warning from this point on.
# NOTE(review): this also hides deprecation warnings raised by the libraries
# used below; consider narrowing the filter to specific categories.
warnings.filterwarnings('ignore')

In [None]:
# Show the first two rows of the Mexico subset again before plotting.
Mexico.head(2)

### Defining the items I am going to use for the graphs that have information on the different sectors of Mexico.

In [None]:
# Per-sector totals for the Mexican loans (loan amount, lender count and funded
# amount), keeping the ten sectors with the largest loan amount.
# The columns are selected with a list: selecting several groupby columns with
# a bare tuple is deprecated and is rejected by current pandas releases.
sector_df = (
    Mexico.groupby('sector')[['loan_amount', 'lender_count', 'funded_amount']]
    .sum()
    .sort_values(by='loan_amount', ascending=False)
    .reset_index()
    .head(10)
)

sector_df

In [None]:
# Per-activity totals for the Mexican loans (loan amount, lender count and
# funded amount), keeping the ten activities with the largest loan amount.
# The columns are selected with a list: selecting several groupby columns with
# a bare tuple is deprecated and is rejected by current pandas releases.
activity_df = (
    Mexico.groupby('activity')[['loan_amount', 'lender_count', 'funded_amount']]
    .sum()
    .sort_values(by='loan_amount', ascending=False)
    .reset_index()
    .head(10)
)

activity_df

### Defining the items I am going to use for the graphs that have information on the different activities of Mexico.

In [None]:
# Series used by the plots below.
# sector, loan, fund and lender are columns of the per-sector table;
# activity and lender_1 are columns of the per-activity table.
sector, loan, fund, lender = (
    sector_df['sector'],
    sector_df['loan_amount'],
    sector_df['funded_amount'],
    sector_df['lender_count'],
)
activity, lender_1 = activity_df['activity'], activity_df['lender_count']

**1. LOAN AMOUNT AGAINST SECTOR**

In [None]:
# Line chart of the total loan amount for each sector in the per-sector table.
fig, ax = plt.subplots(figsize=(10, 5))

ax.set_title('Loan Amount by Sector', fontsize=20)
ax.set_xlabel('Sector', fontsize=15)
ax.set_ylabel('Loan Amount', fontsize=15)

# Tilt the sector names so that neighbouring labels do not overlap.
ax.tick_params(axis='x', labelrotation=75)

ax.plot(sector, loan)

plt.show()

From the graph above we can note that Mexico counts on Agriculture, Retail, Food and Health for its stability; that's why they get the largest loan amounts. From Housing to Manufacturing the curve is almost straight, which suggests that these sectors are comfortable and don't really need loans to keep running: what the country makes is enough to support them.

**2. LOAN AMOUNT AND FUNDED AMOUNT AGAINST ACTIVITY**

In [None]:
# Compare the requested and funded amounts for the activities in activity_df.
# Both series are read from activity_df so that every value belongs to the
# activity named on the x-axis; the `loan` and `fund` series hold per-sector
# totals and must not be drawn against activity names.
fig, ax = plt.subplots(figsize=(10, 5))

ax.set_title('Loan Amount and Funded Amount by activity', fontsize=15)
ax.set_xlabel('activity', fontsize=15)
ax.set_ylabel('Loan Amount', fontsize=15)

# Tilt the activity names so that neighbouring labels do not overlap.
ax.tick_params(axis='x', labelrotation=75)

ax.plot(activity_df['activity'], activity_df['funded_amount'], c='k', label='Funded Amount')
ax.bar(activity_df['activity'], activity_df['loan_amount'], label='Loan Amount')

ax.legend()

plt.show()

In the graph above, we see that from Personal Medical Expenses to Agriculture, Mexico has to get loans to support these activities so that they continue thriving, while from Retail to Taxi the country is able to thrive/survive on what it makes from within, without borrowing.

**3. SECTOR AGAINST LOAN AMOUNT**

In [None]:
# Horizontal bar chart of total loan amount per sector.
fig, ax = plt.subplots(figsize=(10, 5))

ax.set_title('Loan Amount by Sector', fontsize=15)
ax.set_xlabel('Loan Amount', fontsize=15)
ax.set_ylabel('Sector', fontsize=15)

ax.tick_params(axis='x', labelrotation=75)

# The per-sector table is sorted from largest to smallest; reversing both lists
# makes barh draw the largest sector as the top bar.
sector_l = list(sector)[::-1]
loan_l = list(loan)[::-1]

ax.barh(sector_l, loan_l)

plt.show()

From the graph above, we can also say that Mexico relies on Agriculture, Retail, Food and Health to grow and make profits for the country; that is why it gets loans to boost these different sectors.

**4. SCATTER PLOT FOR LOAN AMOUNT VS LENDER COUNT**

In [None]:
# Scatter plot of lender count against loan amount, one marker per sector.
fig, ax = plt.subplots(figsize=(10, 5))

ax.set_title('Loan Amount vs Lender Count', fontsize=20)
ax.set_xlabel('Loan Amount', fontsize=15)
ax.set_ylabel('Lender Count', fontsize=15)

# One colour index per sector, mapped onto the 'Blues' colormap.
colour = np.arange(len(sector))

ax.tick_params(axis='x', labelrotation=75)

# Marker area is the loan amount divided by 1000.
ax.scatter(
    loan,
    lender,
    c=colour,
    cmap='Blues',
    marker='o',
    s=loan / 1000,
    edgecolor='k',
    alpha=1.0,
)

plt.show()

For the scatter graph above, the darker the blue and the smaller the circle, the smaller the loan amount and lender count a sector takes up.

#### THE GRAPHS BELOW SHOW A COMPRESSED VIEW OF THE LOAN AMOUNT AND LENDER COUNT VS SECTOR, AND ALSO THE DISTRIBUTION OF TERM IN MONTHS FOR MEXICO

In [None]:
# 2x2 overview of the Mexico figures; the grid is saved to plot.png.
fig, axes = plt.subplots(2, 2, figsize=(20, 20))
(ax_line, ax_hist), (ax_bar, ax_scatter) = axes

# Top-left: total loan amount per sector.
ax_line.set_title('Loan Amount by Sector')
ax_line.tick_params(axis='x', labelrotation=45)
ax_line.plot(sector, loan)

# Top-right: distribution of the loan term across the Mexican loans.
ax_hist.set_title('Distribution of Term in Months')
ax_hist.tick_params(axis='x', labelrotation=45)
ax_hist.hist(Mexico['term_in_months'], edgecolor='k', bins=15)

# Bottom-left: lender count per sector.
ax_bar.set_title('Lender Count by Sector')
ax_bar.bar(sector, lender)

# Bottom-right: lender count against loan amount, one marker per sector.
# The x-axis uses the loan amount so that the panel shows what its title says;
# it previously plotted the sector names on the x-axis.
colours = np.arange(len(sector_df['sector']))

ax_scatter.set_title('Loan Amount vs Lender Count')
ax_scatter.scatter(
    loan,
    lender,
    c=colours,
    cmap='Blues',
    marker='o',
    edgecolor='k',
    alpha=0.75,
    s=sector_df['loan_amount'] / 1000,
)

fig.savefig('plot.png')
plt.show()

#### Below is a pie chart that clearly shows the percentages of females and males that get loans in Mexico.

In [None]:
# Pie chart of the female/male split of Mexican loans.
# The shares are computed from the gender_lead column rather than typed in by
# hand, so the chart always agrees with the data.
Gender2 = ['Females', 'Males']

# reindex fixes the order to match the labels and fills a missing label with 0.
mexico_gender_totals = Mexico['gender_lead'].value_counts().reindex(['female', 'male'], fill_value=0)
data = (mexico_gender_totals * 100 / mexico_gender_totals.sum()).round(2).tolist()

fig = plt.figure(figsize=(10, 7))
plt.title('Female vs Male Borrowers in Mexico')
# autopct prints each share on its wedge.
plt.pie(data, labels=Gender2, autopct='%1.1f%%')

plt.show()

**THANK YOU**