# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [None]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
from scipy.stats import linregress

# Import API key
from api_keys import weather_api_key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Path of the output CSV file
output_data_file = "output_data/cities.csv"

# (min, max) bounds for the latitudes and longitudes sampled below
lat_range, lng_range = (-90, 90), (-180, 180)

## Generate Cities List

In [None]:
# `cities` holds the unique city names in first-seen order;
# `seen_cities` mirrors it as a set so the uniqueness check is O(1)
# instead of a linear scan of the list on every iteration.
cities = []
seen_cities = set()

# Create a set of random lat and lng combinations
lats = np.random.uniform(lat_range[0], lat_range[1], size=1500)
lngs = np.random.uniform(lng_range[0], lng_range[1], size=1500)
lat_lngs = zip(lats, lngs)

# Identify nearest city for each lat, lng combination
for lat, lng in lat_lngs:
    city = citipy.nearest_city(lat, lng).city_name

    # If the city is unique, then add it to our cities list
    if city not in seen_cities:
        seen_cities.add(city)
        cities.append(city)

# Print the city count to confirm sufficient count
len(cities)

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it's being processed (with the city number and city name).


### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

In [None]:
# Read the saved city weather CSV and wrap it in the DataFrame used below.
# NOTE(review): this path differs from output_data_file ("output_data/cities.csv")
# defined in the setup cell — confirm which location is intended.
city_table = pd.read_csv(
    '../output_data/cities.csv'
)
city_data = pd.DataFrame(data=city_table)

# Display the loaded data
city_data

## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [None]:
# Rows of city_data whose Humidity is 100 or more
is_humid_100 = city_data["Humidity"] >= 100
humidity_100 = city_data[is_humid_100]

In [None]:
# Show the City values of the high-humidity rows in sorted order;
# the index of the displayed Series carries each row's index label.
humidity_100["City"].sort_values()

In [None]:
# Make a new DataFrame from city_data with the high-humidity rows dropped by index.
# drop() returns a new DataFrame by default (inplace=False), so city_data itself is
# left unchanged and the result is stored as "clean_city_data".
# The filter uses >= 100 (same condition as humidity_100), so readings of exactly
# 100% are removed as well.
# Fix: the original referenced an undefined `weather_df`; the loaded data is `city_data`.
clean_city_data = city_data.drop(index=city_data[city_data['Humidity'] >= 100].index)

In [None]:
# Show (rows, columns) of the cleaned data to confirm how many cities remain
clean_city_data.shape

## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

In [None]:
# Scatter plot of Max Temp (x axis) against Latitude (y axis)
x_values = clean_city_data['Max Temp']
y_values = clean_city_data['Lat']
plt.scatter(x_values,y_values)
plt.xlabel('Max Temp')
plt.ylabel('Lat')
plt.title('Max Temperature (F) vs Latitude')

# Save before plt.show(): once the figure has been shown, a later
# savefig call can write an empty image.
plt.savefig("Latitude vs Temperature Plot.png")
plt.show()

The farther a city's latitude is from the equator (0), the lower its max temperature tends to be. The closer the latitude is to the equator, the higher the max temperature.

## Latitude vs. Humidity Plot

In [None]:
# Scatter plot of Humidity (%) (x axis) against Latitude (y axis)
x_values = clean_city_data['Humidity']
y_values = clean_city_data['Lat']
plt.scatter(x_values,y_values)
plt.xlabel('Humidity (%)')
plt.ylabel('Lat')
plt.title('Humidity vs Latitude')

# Save before plt.show(): once the figure has been shown, a later
# savefig call can write an empty image.
plt.savefig("Latitude vs Humidity Plot.png")
plt.show()

In the Humidity vs. Latitude plot, humidity appears to be spread fairly evenly across both sides of the equator.

## Latitude vs. Cloudiness Plot

In [None]:
# Scatter plot of Cloudiness (%) (x axis) against Latitude (y axis)
x_values = clean_city_data['Cloudiness']
y_values = clean_city_data['Lat']
plt.scatter(x_values,y_values)
plt.xlabel('Cloudiness (%)')
plt.ylabel('Lat')
plt.title('Cloudiness vs Latitude')

# Save before plt.show(): once the figure has been shown, a later
# savefig call can write an empty image.
plt.savefig("Latitude vs Cloudiness Plot.png")
plt.show()

The cloudiness (%) is about the same on both sides of the equator. There is no particular pattern.

## Latitude vs. Wind Speed Plot

In [None]:
# Scatter plot of Wind Speed (x axis) against Latitude (y axis)
x_values = clean_city_data['Wind Speed']
y_values = clean_city_data['Lat']
plt.scatter(x_values,y_values)
plt.xlabel('Wind Speed')
plt.ylabel('Lat')
plt.title('Wind Speed vs Latitude')

# Save before plt.show(): once the figure has been shown, a later
# savefig call can write an empty image.
plt.savefig("Latitude vs Wind Speed Plot.png")
plt.show()

## Linear Regression

In [None]:
# Scatter plot and linear regression for Max Temp vs Latitude (all cities)

# Select the data BEFORE fitting. The original called linregress first, so the
# fit used whatever x_values/y_values the previously executed cell left behind.
x_values = clean_city_data['Max Temp']
y_values = clean_city_data['Lat']

# Perform a linear regression on temperature vs. latitude
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)

# Get regression values
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x +" + str(round(intercept,2))

plt.scatter(x_values,y_values)
plt.plot(x_values,regress_values,"r-")

# Temperature is reported in F elsewhere in this notebook, not in percent
plt.xlabel('Max Temp (F)')
plt.ylabel('Lat')
plt.title('Max Temp vs Latitude Linear Regression')
plt.annotate(line_eq,(70,-50),fontsize=15,color="red")

# rvalue**2 is the coefficient of determination, so label it as r-squared
print(f"The r-squared is: {rvalue**2}")

# Save before plt.show(): once the figure has been shown, a later
# savefig call can write an empty image.
plt.savefig("Latitude vs Max Temp Plot Linear Regression.png")
plt.show()

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

In [None]:
# Northern Hemisphere subset: rows with Lat >= 0
NH_clean_city_data = clean_city_data[clean_city_data.Lat>=0]

# Select the data BEFORE fitting. The original called linregress first, so the
# fit used the x_values/y_values left over from the previously executed cell.
x_values = NH_clean_city_data['Max Temp']
y_values = NH_clean_city_data['Lat']

(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)

# Fitted line and its equation text for the annotation
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x +" + str(round(intercept,2))
plt.plot(x_values,regress_values,"r-")

# rvalue**2 is the coefficient of determination, so label it as r-squared
print(f"The r-squared is: {rvalue**2}")
plt.scatter(x_values,y_values)
plt.xlabel('Max Temp')
plt.ylabel('Lat')
plt.title('Northern Hemisphere Max Temperature (F) vs Latitude')
plt.annotate(line_eq,(10,0),fontsize=15,color="red")

# Save before plt.show(): once the figure has been shown, a later
# savefig call can write an empty image.
plt.savefig("North Latitude vs Temperature Plot.png")
plt.show()

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

In [None]:
# Southern Hemisphere subset: rows with Lat < 0
SH_clean_city_data = clean_city_data[clean_city_data.Lat<0]

# Select the data BEFORE fitting. The original called linregress first, so the
# fit used the x_values/y_values left over from the previously executed cell.
x_values = SH_clean_city_data['Max Temp']
y_values = SH_clean_city_data['Lat']

(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)

# Fitted line and its equation text for the annotation
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x +" + str(round(intercept,2))
plt.plot(x_values,regress_values,"r-")

# rvalue**2 is the coefficient of determination, so label it as r-squared
print(f"The r-squared is: {rvalue**2}")
plt.scatter(x_values,y_values)
plt.xlabel('Max Temp')
plt.ylabel('Lat')
plt.title('Southern Hemisphere Max Temperature (F) vs Latitude')
plt.annotate(line_eq,(70,-40),fontsize=15,color="red")

# Save before plt.show(): once the figure has been shown, a later
# savefig call can write an empty image.
plt.savefig("South Latitude vs Temperature Plot.png")
plt.show()

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

In [None]:
# Northern Hemisphere: Humidity vs Latitude with linear regression.
# Select the data BEFORE fitting. The original called linregress first, so the
# fit used the x_values/y_values left over from the previously executed cell.
x_values = NH_clean_city_data['Humidity']
y_values = NH_clean_city_data['Lat']

(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)

# Fitted line and its equation text for the annotation
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x +" + str(round(intercept,2))
plt.plot(x_values,regress_values,"r-")

# rvalue**2 is the coefficient of determination, so label it as r-squared
print(f"The r-squared is: {rvalue**2}")
plt.scatter(x_values,y_values)
plt.xlabel('Humidity')
plt.ylabel('Lat')
plt.title('Northern Hemisphere Humidity vs Latitude')
plt.annotate(line_eq,(10,0),fontsize=15,color="red")

# Save before plt.show(): once the figure has been shown, a later
# savefig call can write an empty image.
plt.savefig("North Latitude vs Humidity Plot.png")
plt.show()

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

In [None]:
# Southern Hemisphere: Humidity vs Latitude with linear regression.
# Select the data BEFORE fitting. The original called linregress first, so the
# fit used the x_values/y_values left over from the previously executed cell.
x_values = SH_clean_city_data['Humidity']
y_values = SH_clean_city_data['Lat']

(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)

# Fitted line and its equation text for the annotation
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x +" + str(round(intercept,2))
plt.plot(x_values,regress_values,"r-")

# rvalue**2 is the coefficient of determination, so label it as r-squared
print(f"The r-squared is: {rvalue**2}")
plt.scatter(x_values,y_values)
plt.xlabel('Humidity')
plt.ylabel('Lat')
plt.title('Southern Hemisphere Humidity vs Latitude')
plt.annotate(line_eq,(70,-50),fontsize=15,color="red")

# Save before plt.show(): once the figure has been shown, a later
# savefig call can write an empty image.
plt.savefig("South Latitude vs Humidity Plot.png")
plt.show()

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

In [None]:
# Northern Hemisphere: Cloudiness vs Latitude with linear regression
x_values = NH_clean_city_data['Cloudiness']
y_values = NH_clean_city_data['Lat']

# Fit this cell's own data. The original had no linregress call here, so the
# line, equation and printed value reused slope/intercept/rvalue from an earlier cell.
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)

# Fitted line and its equation text for the annotation
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x +" + str(round(intercept,2))
plt.plot(x_values,regress_values,"r-")

# rvalue**2 is the coefficient of determination, so label it as r-squared
print(f"The r-squared is: {rvalue**2}")
plt.scatter(x_values,y_values)
plt.xlabel('Cloudiness')
plt.ylabel('Lat')
plt.title('Northern Hemisphere Cloudiness vs Latitude')
plt.annotate(line_eq,(10,0),fontsize=15,color="red")

# Save before plt.show(): once the figure has been shown, a later
# savefig call can write an empty image.
plt.savefig("North Latitude vs Cloudiness Plot.png")
plt.show()

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

In [None]:
# Southern Hemisphere: Cloudiness vs Latitude with linear regression
x_values = SH_clean_city_data['Cloudiness']
y_values = SH_clean_city_data['Lat']

# Fit this cell's own data. The original had no linregress call here, so the
# line, equation and printed value reused slope/intercept/rvalue from an earlier cell.
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)

# Fitted line and its equation text for the annotation
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x +" + str(round(intercept,2))
plt.plot(x_values,regress_values,"r-")

# rvalue**2 is the coefficient of determination, so label it as r-squared
print(f"The r-squared is: {rvalue**2}")
plt.scatter(x_values,y_values)
plt.xlabel('Cloudiness')
plt.ylabel('Lat')
plt.title('Southern Hemisphere Cloudiness vs Latitude')
plt.annotate(line_eq,(70,-50),fontsize=15,color="red")

# Save before plt.show(): once the figure has been shown, a later
# savefig call can write an empty image.
plt.savefig("South Latitude vs Cloudiness Plot.png")
plt.show()

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

In [None]:
# Northern Hemisphere: Wind Speed vs Latitude with linear regression
x_values = NH_clean_city_data['Wind Speed']
y_values = NH_clean_city_data['Lat']

# Fit this cell's own data. The original had no linregress call here, so the
# line, equation and printed value reused slope/intercept/rvalue from an earlier cell.
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)

# Fitted line and its equation text for the annotation
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x +" + str(round(intercept,2))
plt.plot(x_values,regress_values,"r-")

# rvalue**2 is the coefficient of determination, so label it as r-squared
print(f"The r-squared is: {rvalue**2}")
plt.scatter(x_values,y_values)
plt.xlabel('Wind Speed')
plt.ylabel('Lat')
plt.title('Northern Hemisphere Wind Speed vs Latitude')
# NOTE(review): y=-10 is below every northern-hemisphere latitude (Lat >= 0), so this
# label may fall outside the axes and not be drawn — confirm the intended position.
plt.annotate(line_eq,(10,-10),fontsize=15,color="red")

# Save before plt.show(): once the figure has been shown, a later
# savefig call can write an empty image.
plt.savefig("North Latitude vs Wind Speed Plot.png")
plt.show()

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

In [None]:
# Southern Hemisphere: Wind Speed vs Latitude with linear regression
x_values = SH_clean_city_data['Wind Speed']
y_values = SH_clean_city_data['Lat']

# Fit this cell's own data. The original had no linregress call here, so the
# line, equation and printed value reused slope/intercept/rvalue from an earlier cell.
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)

# Fitted line and its equation text for the annotation
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x +" + str(round(intercept,2))
plt.plot(x_values,regress_values,"r-")

# rvalue**2 is the coefficient of determination, so label it as r-squared
print(f"The r-squared is: {rvalue**2}")
plt.scatter(x_values,y_values)
plt.xlabel('Wind Speed')
plt.ylabel('Lat')
plt.title('Southern Hemisphere Wind Speed vs Latitude')
plt.annotate(line_eq,(10,-50),fontsize=15,color="red")

# Save before plt.show(): once the figure has been shown, a later
# savefig call can write an empty image.
plt.savefig("South Latitude vs Wind Speed Plot.png")
plt.show()