# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [2]:
import os
import csv
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
from scipy.stats import linregress
from pprint import pprint
import datetime

# Import API key
from api_keys import weather_api_key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Output File (CSV)
output_data_file = "output_data/cities.csv"

# Range of latitudes and longitudes
lat_range = (-90, 90)
lng_range = (-180, 180)

## Generate Cities List

In [3]:
# List for holding lat_lngs and cities
lat_lngs = []
cities = []

# Create a set of random lat and lng combinations
lats = np.random.uniform(low=-90.000, high=90.000, size=1500)
lngs = np.random.uniform(low=-180.000, high=180.000, size=1500)
lat_lngs = zip(lats, lngs)

# Identify nearest city for each lat, lng combination
for lat_lng in lat_lngs:
    city = citipy.nearest_city(lat_lng[0], lat_lng[1]).city_name
    
    # If the city is unique, then add it to a our cities list
    if city not in cities:
        cities.append(city)

# Print the city count to confirm sufficient count
len(cities)

637

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it'sbeing processed (with the city number and city name).


In [4]:
new_cities = []
country = []
date = []
temp = []
humidity = []
lat = []
lng = []
cloudiness = []
wind = []

In [None]:
record_counter = 0
set_counter = 0

# URL < Weather Map API Call >

weather_api_key = "25691d94d9685987788b6b5fa530cfcf"
url = "http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key 
print('------------------------')
print('Fetching Data Requests')
print('------------------------')

for city in cities:
    query_url = url + "&q=" + city
    # Get weather data
    response = requests.get(query_url).json()
    if record_counter < 50:
        record_counter += 1
    else:
        set_counter += 1
        record_counter = 0

    print('Processing record {} of set {} | {}'.format(record_counter, set_counter, city))
    print(url)
    try:
        date.append(response['dt'])
        country.append(response['sys']['country'])
        lat.append(response['coord']['lat'])
        lng.append(response['coord']['lon'])
        temp.append(response['main']['temp_max'])
        humidity.append(response['main']['humidity'])
        wind.append(response['wind']['speed'])
        cloudiness.append(response['clouds']['all'])
        new_cities.append(city)
    except:
        print("CITY NOT FOUND")
        pass

print('-------------------------')
print('Data Download Complete')
print('-------------------------')

------------------------
Fetching Data Requests
------------------------
Processing record 1 of set 0 | xuddur
http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=25691d94d9685987788b6b5fa530cfcf
Processing record 2 of set 0 | mataura
http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=25691d94d9685987788b6b5fa530cfcf
Processing record 3 of set 0 | dingle
http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=25691d94d9685987788b6b5fa530cfcf
Processing record 4 of set 0 | norman wells
http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=25691d94d9685987788b6b5fa530cfcf
Processing record 5 of set 0 | sakakah
http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=25691d94d9685987788b6b5fa530cfcf
Processing record 6 of set 0 | zhigansk
http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=25691d94d9685987788b6b5fa530cfcf
Processing record 7 of set 0 | albany
http://api.openweathermap.org/data/2.5/weathe

Processing record 8 of set 1 | lebu
http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=25691d94d9685987788b6b5fa530cfcf
Processing record 9 of set 1 | meyungs
http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=25691d94d9685987788b6b5fa530cfcf
CITY NOT FOUND
Processing record 10 of set 1 | ponta do sol
http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=25691d94d9685987788b6b5fa530cfcf
Processing record 11 of set 1 | hilo
http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=25691d94d9685987788b6b5fa530cfcf
Processing record 12 of set 1 | nanortalik
http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=25691d94d9685987788b6b5fa530cfcf
Processing record 13 of set 1 | kapaa
http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=25691d94d9685987788b6b5fa530cfcf
Processing record 14 of set 1 | rengo
http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=25691d94d9685987788b6b5fa530cfcf
Pr

Processing record 14 of set 2 | beira
http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=25691d94d9685987788b6b5fa530cfcf
Processing record 15 of set 2 | narsaq
http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=25691d94d9685987788b6b5fa530cfcf
Processing record 16 of set 2 | puerto ayora
http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=25691d94d9685987788b6b5fa530cfcf
Processing record 17 of set 2 | nortelandia
http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=25691d94d9685987788b6b5fa530cfcf
Processing record 18 of set 2 | coffs harbour
http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=25691d94d9685987788b6b5fa530cfcf
Processing record 19 of set 2 | ribeira grande
http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=25691d94d9685987788b6b5fa530cfcf
Processing record 20 of set 2 | victoria
http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=25691d94d9685987788b6b5fa5

### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

In [None]:
weather_dict = {
    "City": new_cities,
    "Country": country,
    "Date": date,
    "Lat": lat,
    "Lng": lng,
    "Temp": temp,
    "Humidity": humidity,
    "Cloudiness": cloudiness,
    "Wind Speed": wind
}
weather_data = pd.DataFrame(weather_dict)
weather_data.count()

In [None]:
weather_data.head()

In [None]:
cities_list = zip(new_cities,cloudiness,country,date,humidity,temp,lat,lng)

# Set Output File Variable
output_file = os.path.join('..', 'output_data', 'cities.csv')

# Open Output File
with open(output_file, 'w') as datafile:
    weather_data.to_csv(output_file)

### Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

#### Latitude vs. Temperature Plot

In [None]:
weather_data.plot(kind='scatter', x='Lat', y='Temp', c='DarkBlue')
plt.title('City Latitude vs Temperature')
plt.xlabel('Latitude')
plt.ylabel('Max Temperature (F)')
plt.grid()
plt.savefig("../output_data/Latitude_vs_Temperature.png")
plt.grid()

#### Latitude vs. Humidity Plot

In [None]:
weather_data.plot(kind='scatter',x='Lat',y='Humidity', c='DarkBlue')
plt.title('City Latitude vs Humidity')
plt.xlabel('Latitude')
plt.ylabel('Humidity (%)')
plt.grid()
plt.savefig("../output_data/Latitude_vs_Humidity.png")
plt.grid()

#### Latitude vs. Cloudiness Plot

In [None]:
weather_data.plot(kind='scatter',x='Lat',y='Cloudiness', c='DarkBlue')
plt.title('City Latitude vs Cloudiness')
plt.xlabel('Latitude')
plt.ylabel('Cloudiness (%)')
plt.grid()
plt.savefig("../output_data/Latitude_vs_Cloudiness.png")
plt.grid()

#### Latitude vs. Wind Speed Plot

In [None]:
weather_data.plot(kind='scatter',x='Lat',y='Wind Speed', c='DarkBlue')
plt.title('City Latitude vs Wind Speed')
plt.xlabel('Latitude')
plt.ylabel('Wind Speed (mph)')
plt.grid()
plt.savefig("../output_data/Latitude_vs_Wind_Speed.png")
plt.grid()

## Linear Regression

In [None]:
# OPTIONAL: Create a function to create Linear Regression plots

# def make_lin_reg_plot(x_values,y_values,x_desc,y_desc,hemisphere,filename,x_ann,y_ann):
    # Print out the r-squared value along with the plot.
    # (slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
    # regress_values = x_values * slope + intercept
    # line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
    # plt.scatter(x_values,y_values,edgecolors='black')
    # plt.plot(x_values,regress_values,"r-")
    # plt.title(f"{hemisphere}-\nCity {x_desc} vs. {y_desc} {weatherDate}")
    # plt.annotate(line_eq,(x_ann,y_ann),fontsize=15,color="red")
    # plt.xlabel(x_desc)
    # plt.ylabel(y_desc)
    # print(f"The r-squared is: {rvalue}")
    # print(line_eq)
    # plt.savefig(f'Figures/{filename}')
    # plt.show()

In [None]:
# Create Northern and Southern Hemisphere DataFrames

North_df = weather_data.loc[weather_data['Lat'] >=0]
South_df = weather_data.loc[weather_data['Lat'] < 0]

North_df.head()

In [None]:
South_df.head()

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

In [None]:
x_values = North_df['Lat'].astype('float')
y_values = North_df['Temp'].astype('float')

# Regression
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
rvalue = "R:Value=" + "  " + str(round(rvalue, 2))

# Scatter plot
plt.scatter(x_values,y_values, color="green")

# Regression line
plt.plot(x_values,regress_values,"b-")
plt.annotate(line_eq,(5, 25),fontsize=15,color="blue")
plt.annotate(rvalue,(5,17),fontsize=15,color="red")

# Labels
plt.xlabel('Latitude')
plt.ylabel('Temperature (F)')
plt.title(f"Northern Hemisphere: Temperature vs Latitude Regression")

plt.grid()
plt.savefig("../output_data/Northern_Hemisphere_Temp_vs_Latitude_Regression.png")
plt.grid()

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

In [None]:
x_values = South_df['Lat'].astype('float')
y_values = South_df['Temp'].astype('float')

# Regression
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
rvalue = "R:Value=" + "  " + str(round(rvalue, 2))

# Scatter plot
plt.scatter(x_values,y_values, color="green")

# Regression line
plt.plot(x_values,regress_values,"b-")
plt.annotate(line_eq,(-50, 85),fontsize=15,color="blue")
plt.annotate(rvalue,(-50, 80),fontsize=15,color="red")

# Labels
plt.xlabel('Latitude')
plt.ylabel('Temperature (F)')
plt.title(f"Southern Hemisphere: Max Temp vs Latitude Regression")

plt.grid()
plt.savefig("../output_data/Southern_Hemisphere_Temp_vs_Latitude_Regression.png")
plt.grid()

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

In [None]:
x_values = North_df['Lat'].astype('float')
y_values = North_df['Humidity'].astype('float')

# Regression
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
rvalue = "R:Value =" + "  " + str(round(rvalue, 2))

# Scatter plot
plt.scatter(x_values,y_values, color="green")

# Regression line
plt.plot(x_values,regress_values,"b-")
plt.annotate(line_eq,(48,20),fontsize=15,color="blue")
plt.annotate(rvalue,(48, 10),fontsize=15,color="red")

# Labels
plt.xlabel('Latitude')
plt.ylabel('Humidity (%)')
plt.title(f"Northern Hemisphere: Humidity vs Latitude Regression")

plt.grid()
plt.savefig("../output_data/Northern_Hemisphere_Humidity_vs_Latitude_Regression.png")
plt.grid()

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

In [None]:
x_values = South_df['Lat'].astype('float')
y_values = South_df['Humidity'].astype('float')

# Regression
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
rvalue = "R:Value =" + "  " + str(round(rvalue, 2))

# Scatter plot
plt.scatter(x_values,y_values, color="green")

# Regression line
plt.plot(x_values,regress_values,"b-")
plt.annotate(line_eq,(-55,200),fontsize=15,color="blue")
plt.annotate(rvalue,(-55, 175),fontsize=15,color="red")

# Labels
plt.xlabel('Latitude')
plt.ylabel('Humidity (%)')
plt.title(f"Southern Hemisphere: Humidity vs Latitude Regression")

plt.grid()
plt.savefig("../output_data/Southern_Hemisphere_Humidity_vs_Latitude_Regression.png")
plt.grid()

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

In [None]:
x_values = North_df['Lat'].astype('float')
y_values = North_df['Cloudiness'].astype('float')

# Regression
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
rvalue = "R:Value =" + "  " + str(round(rvalue, 2))

# Scatter plot
plt.scatter(x_values,y_values, color="green")

# Regression line
plt.plot(x_values,regress_values,"b-")
plt.annotate(line_eq,(25,65),fontsize=15,color="blue")
plt.annotate(rvalue,(25, 55),fontsize=15,color="red")

# Labels
plt.xlabel('Latitude')
plt.ylabel('Cloudiness (%)')
plt.title(f"Northern Hemisphere: Cloudiness vs Latitude Regression")

plt.grid()
plt.savefig("../output_data/Northern_Hemisphere_Cloudiness_vs_Latitude_Regression.png")
plt.grid()

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

In [None]:
x_values = South_df['Lat'].astype('float')
y_values = South_df['Cloudiness'].astype('float')

# Regression
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
rvalue = "R:Value =" + "  " + str(round(rvalue, 2))

# Scatter plot
plt.scatter(x_values,y_values, color="green")

# Regression line
plt.plot(x_values,regress_values,"b-")
plt.annotate(line_eq,(-55,13),fontsize=15,color="blue")
plt.annotate(rvalue,(-55, 3),fontsize=15,color="red")

# Labels
plt.xlabel('Latitude')
plt.ylabel('Cloudiness (%)')
plt.title(f"Southern Hemisphere: Cloudiness vs Latitude Regression")

plt.grid()
plt.savefig("../output_data/Southern_Hemisphere_Cloudiness_vs_Latitude_Regression.png")
plt.grid()

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

In [None]:
x_values = North_df['Lat'].astype('float')
y_values = North_df['Wind Speed'].astype('float')

# Regression
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
rvalue = "R:Value =" + "  " + str(round(rvalue, 2))

# Scatter plot
plt.scatter(x_values,y_values, color="green")

# Regression line
plt.plot(x_values,regress_values,"b-")
plt.annotate(line_eq,(25,65),fontsize=15,color="blue")
plt.annotate(rvalue,(25, 55),fontsize=15,color="red")

# Labels
plt.xlabel('Latitude')
plt.ylabel('Wind Speed (mph)')
plt.title(f"Northern Hemisphere: Wind Speed vs Latitude Regression")

plt.grid()
plt.savefig("../output_data/Northern_Hemisphere_Wind_Speed_vs_Latitude_Regression.png")
plt.grid()

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

In [None]:
x_values = South_df['Wind Speed'].astype('float')
y_values = South_df['Cloudiness'].astype('float')

# Regression
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
rvalue = "R:Value =" + "  " + str(round(rvalue, 2))

# Scatter plot
plt.scatter(x_values,y_values, color="green")

# Regression line
plt.plot(x_values,regress_values,"b-")
plt.annotate(line_eq,(-55,13),fontsize=15,color="blue")
plt.annotate(rvalue,(-55, 3),fontsize=15,color="red")

# Labels
plt.xlabel('Latitude')
plt.ylabel('Wind Speed (mph)')
plt.title(f"Southern Hemisphere: Wind Speed vs Latitude Regression")

plt.grid()
plt.savefig("../output_data/Southern_Hemisphere_Wind_Speed_vs_Latitude_Regression.png")
plt.grid()