# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [2]:
!pip install citipy



In [3]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
from scipy.stats import linregress
from pprint import pprint

# Import API key
from api_keys import weather_api_key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Bounds used when sampling random coordinates: (min, max) in degrees.
lng_range = (-180, 180)
lat_range = (-90, 90)

# Path of the CSV output file.
output_data_file = "output_data/cities.csv"

ModuleNotFoundError: No module named 'api_keys'

## Generate Cities List

In [None]:
# Draw 1500 random latitudes and 1500 random longitudes and pair them up.
lats = np.random.uniform(*lat_range, size=1500)
lngs = np.random.uniform(*lng_range, size=1500)
lat_lngs = zip(lats, lngs)

# Look up the nearest city for every coordinate pair. dict.fromkeys keeps only the
# first occurrence of each name and preserves the order in which names were seen.
cities = list(dict.fromkeys(
    citipy.nearest_city(lat, lng).city_name for lat, lng in lat_lngs
))

# Show how many unique cities were found.
len(cities)

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it's being processed (with the city number and city name).


In [None]:
# Request URL without the city. The key comes from `weather_api_key` (imported from
# api_keys at the top of the notebook) instead of being written into the notebook,
# and HTTPS is used so the key is not sent in clear text.
url = f"https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID={weather_api_key}"

# Lists for DataFrame (one entry per successfully processed city)
city_two = []
cloudinesses = []
dates = []
humidities = []
lats = []
lngs = []
max_temps = []
wind_speeds = []
countries = []

# Record counter within the current set, and the current set number
count_one = 0
set_one = 1

# Query the API once per city and collect the fields used by the DataFrame
for city in cities:

    try:
        # `params` lets requests encode the city name (spaces, accents, '&', ...);
        # the timeout stops a single stalled request from hanging the whole run.
        response = requests.get(url, params={"q": city}, timeout=10).json()

        # Read every field BEFORE appending anything. If any field is missing the
        # city is skipped as a whole, so all lists always keep the same length.
        cloudiness = response['clouds']['all']
        country = response['sys']['country']
        date = response['dt']
        humidity = response['main']['humidity']
        lat = response['coord']['lat']
        lng = response['coord']['lon']
        max_temp = response['main']['temp_max']
        wind_speed = response['wind']['speed']
    except Exception:
        # Best effort: any failed request or incomplete response just skips the city.
        print("Skipping no city found")
        continue

    cloudinesses.append(cloudiness)
    countries.append(country)
    dates.append(date)
    humidities.append(humidity)
    lats.append(lat)
    lngs.append(lng)
    max_temps.append(max_temp)
    wind_speeds.append(wind_speed)
    city_two.append(city)

    # Start a new set once the record counter has passed 48
    if count_one > 48:
        count_one = 1
        set_one += 1
    else:
        count_one += 1
    print(f"Processing Record {count_one} of Set {set_one} | {city}")

### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

In [None]:
# Map each DataFrame column name to the list of values collected for it.
weatherdictionary = {
    "City": city_two,
    "Cloudiness": cloudinesses,
    "Country": countries,
    "Date": dates,
    "Humidity": humidities,
    "Lat": lats,
    "Lng": lngs,
    "Max Temp": max_temps,
    "Wind Speed": wind_speeds,
}

# Build the DataFrame from the dictionary and preview its first rows.
weatherdataframe = pd.DataFrame(data=weatherdictionary)
weatherdataframe.head()

In [None]:
# Write the city data to output.csv, then display the per-column count.
weatherdataframe.to_csv(path_or_buf="output.csv")
weatherdataframe.count()

## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [None]:
# Show summary statistics of the city data. The Humidity column of this summary can be
# used to check whether any city reports humidity over 100%; this cell does not itself
# compute the indices of such cities.

weatherdataframe.describe()

In [None]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


In [None]:
# Extract relevant fields from the data frame


# Export the City_Data into a csv


## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

In [None]:
# Scatter of every city's latitude against its maximum temperature.
fig, ax = plt.subplots()
ax.scatter(weatherdataframe["Lat"], weatherdataframe["Max Temp"])
ax.set_title("Latitude vs. Maximum Temperature")
ax.set_xlabel("Latitude")
ax.set_ylabel("Maximum Temperature (F)")
ax.grid(True)

# Write the PNG first, then display the figure.
fig.savefig("figure1.png")
plt.show()

## Latitude vs. Humidity Plot

In [None]:
# Scatter of every city's latitude against its humidity.
fig, ax = plt.subplots()
ax.scatter(weatherdataframe["Lat"], weatherdataframe["Humidity"])
ax.set(title="Latitude vs. Humidity", xlabel="Latitude", ylabel="Humidity (%)")
ax.grid(True)

# Write the PNG first, then display the figure.
fig.savefig("figure2.png")
plt.show()

## Latitude vs. Cloudiness Plot

In [None]:
# Scatter of every city's latitude against its cloudiness.
fig, ax = plt.subplots()
ax.grid(True)
ax.scatter(weatherdataframe["Lat"], weatherdataframe["Cloudiness"])
ax.set_xlabel("Latitude")
ax.set_ylabel("Cloudiness")
ax.set_title("Latitude vs. Cloudiness")

# Write the PNG first, then display the figure.
fig.savefig("figure3.png")
plt.show()

## Latitude vs. Wind Speed Plot

In [None]:
# Scatter of every city's latitude against its wind speed.
plt.scatter(weatherdataframe["Lat"],weatherdataframe["Wind Speed"])
plt.title("Latitude vs. Wind Speed")
plt.xlabel("Latitude")
plt.ylabel("Wind Speed")
# Keep the original (-2, 34) window when the data fits in it, but raise the upper
# limit when a city is windier than that, so no point is silently cut off.
plt.ylim(-2, max(34, weatherdataframe["Wind Speed"].max() + 2))
plt.grid(True)
plt.savefig("figure4.png")
plt.show()

## Data Analysis

## Linear Regression

In [None]:
# OPTIONAL: Create a function to create Linear Regression plots

In [None]:
# Create Northern and Southern Hemisphere DataFrames.
# Rows with latitude exactly 0 go to the northern frame only; the southern frame uses a
# strict "< 0" so that no city is counted in both hemispheres.

northernhemi = weatherdataframe.loc[(weatherdataframe["Lat"] >= 0)]
southernhemi = weatherdataframe.loc[(weatherdataframe["Lat"] < 0)]

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

In [None]:
# Northern-hemisphere regression inputs: max temperature (y) and latitude (x).
northernmaxtemp, northernlatitude = (northernhemi[col] for col in ("Max Temp", "Lat"))

In [None]:
# Linear regression of max temperature on latitude; report the line and its R-squared.
slope, intercept, r_value, p_value, std_err = linregress(x=northernlatitude, y=northernmaxtemp)
print("slope: %f    intercept: %f" % (slope, intercept))
print("R-squared: %f" % (r_value ** 2))

In [None]:
# Plot the observations and the fitted line (slope, intercept and r_value come from the
# linregress call). The labels give plt.legend() entries to display.
plt.plot(northernlatitude, northernmaxtemp, 'o', label="Cities")
plt.plot(northernlatitude, intercept + slope*northernlatitude, 'r', label="Linear fit")
plt.title("Northern Hemisphere: Max Temp vs. Latitude")
plt.xlabel("Latitude")
plt.ylabel("Max Temp")
plt.legend()
print("R-squared: %f" % r_value**2)
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
# Place the equation in axes-fraction coordinates so it stays inside the plot whatever
# the data range is (a fixed data point such as (10, 30) can fall outside the axes).
plt.annotate(line_eq, xy=(0.05, 0.05), xycoords="axes fraction", fontsize=15, color="red")

# Save before show(): after show() the figure is typically closed, so a later savefig
# would write an empty image.
# NOTE(review): the file name is spelled "figur4.png" in the notebook; left unchanged.
plt.savefig("figur4.png")
plt.show()


####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

In [None]:
# Southern-hemisphere regression inputs: max temperature (y) and latitude (x).
southernmaxtemp, southernlatitude = (southernhemi[col] for col in ("Max Temp", "Lat"))

In [None]:
# Linear regression of max temperature on latitude; report the line and its R-squared.
slope, intercept, r_value, p_value, std_err = linregress(x=southernlatitude, y=southernmaxtemp)
print("slope: %f    intercept: %f" % (slope, intercept))
print("R-squared: %f" % (r_value ** 2))

In [None]:
# Plot the observations and the fitted line (slope, intercept and r_value come from the
# linregress call). The labels give plt.legend() entries to display.
plt.plot(southernlatitude, southernmaxtemp, 'o', label="Cities")
plt.plot(southernlatitude, intercept + slope*southernlatitude, 'r', label="Linear fit")
plt.title("Southern Hemisphere: Max Temp vs. Latitude")
plt.xlabel("Latitude")
plt.ylabel("Max Temp")
plt.legend()
print("R-squared: %f" % r_value**2)
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
# Place the equation in axes-fraction coordinates: the data point (10, 30) has a positive
# latitude, which is outside the range of the southern-hemisphere x axis.
plt.annotate(line_eq, xy=(0.05, 0.05), xycoords="axes fraction", fontsize=15, color="red")

# Save before show(): after show() the figure is typically closed, so a later savefig
# would write an empty image.
plt.savefig("figure5.png")
plt.show()


####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

In [None]:
# Northern-hemisphere regression inputs: humidity (y) and latitude (x).
northernhumid, northernlatitude = (northernhemi[col] for col in ("Humidity", "Lat"))

In [None]:
# Linear regression of humidity on latitude; report the line and its R-squared.
slope, intercept, r_value, p_value, std_err = linregress(x=northernlatitude, y=northernhumid)
print("slope: %f    intercept: %f" % (slope, intercept))
print("R-squared: %f" % (r_value ** 2))

In [None]:
# Plot the observations and the fitted line (slope, intercept and r_value come from the
# linregress call). The labels give plt.legend() entries to display.
plt.plot(northernlatitude, northernhumid, 'o', label="Cities")
plt.plot(northernlatitude, intercept + slope*northernlatitude, 'r', label="Linear fit")
plt.title("Northern Hemisphere: Latitude vs Humidity")
plt.xlabel("Latitude")
plt.ylabel("Humidity")
plt.legend()
print("R-squared: %f" % r_value**2)
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
# Place the equation in axes-fraction coordinates so it stays inside the plot whatever
# the data range is (a fixed data point such as (10, 30) can fall outside the axes).
plt.annotate(line_eq, xy=(0.05, 0.05), xycoords="axes fraction", fontsize=15, color="red")

# Save before show(): after show() the figure is typically closed, so a later savefig
# would write an empty image.
# NOTE(review): the file name is spelled "figur6.png" in the notebook; left unchanged.
plt.savefig("figur6.png")
plt.show()


####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

In [None]:
# Southern-hemisphere regression inputs: humidity (y) and latitude (x).
southernhumid, southernlatitude = (southernhemi[col] for col in ("Humidity", "Lat"))

In [None]:
# Linear regression of humidity on latitude; report the line and its R-squared.
slope, intercept, r_value, p_value, std_err = linregress(x=southernlatitude, y=southernhumid)
print("slope: %f    intercept: %f" % (slope, intercept))
print("R-squared: %f" % (r_value ** 2))

In [None]:
# Plot the observations and the fitted line (slope, intercept and r_value come from the
# linregress call). The labels give plt.legend() entries to display.
plt.plot(southernlatitude, southernhumid, 'o', label="Cities")
plt.plot(southernlatitude, intercept + slope*southernlatitude, 'r', label="Linear fit")
plt.title("Southern Hemisphere: Latitude vs Humidity")
plt.xlabel("Latitude")
plt.ylabel("Humidity")
plt.legend()
print("R-squared: %f" % r_value**2)
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
# Place the equation in axes-fraction coordinates: the data point (10, 30) has a positive
# latitude, which is outside the range of the southern-hemisphere x axis.
plt.annotate(line_eq, xy=(0.05, 0.05), xycoords="axes fraction", fontsize=15, color="red")

# Save before show(): after show() the figure is typically closed, so a later savefig
# would write an empty image.
plt.savefig("figure7.png")
plt.show()


####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

In [None]:
# Northern-hemisphere regression inputs: latitude (x) and cloudiness (y).
northernlatitude, northerncloudiness = (northernhemi[col] for col in ("Lat", "Cloudiness"))

# Linear regression of cloudiness on latitude; report the line and its R-squared.
slope, intercept, r_value, p_value, std_err = linregress(x=northernlatitude, y=northerncloudiness)
print("slope: %f    intercept: %f" % (slope, intercept))
print("R-squared: %f" % (r_value ** 2))

In [None]:
# Plot the observations and the fitted line (slope, intercept and r_value come from the
# linregress call). The labels give plt.legend() entries to display.
plt.plot(northernlatitude, northerncloudiness, 'o', label="Cities")
plt.plot(northernlatitude, intercept + slope*northernlatitude, 'r', label="Linear fit")
plt.title("Northern Hemisphere: Latitude vs Cloudiness")
plt.xlabel("Latitude")
plt.ylabel("Cloudiness")
plt.legend()
print("R-squared: %f" % r_value**2)
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
# Place the equation in axes-fraction coordinates so it stays inside the plot whatever
# the data range is (a fixed data point such as (10, 30) can fall outside the axes).
plt.annotate(line_eq, xy=(0.05, 0.05), xycoords="axes fraction", fontsize=15, color="red")

# Save before show(): after show() the figure is typically closed, so a later savefig
# would write an empty image.
plt.savefig("figure8.png")
plt.show()


####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

In [None]:
# Southern-hemisphere regression inputs: latitude (x) and cloudiness (y).
southernlatitude, southerncloudiness = (southernhemi[col] for col in ("Lat", "Cloudiness"))

# Linear regression of cloudiness on latitude; report the line and its R-squared.
slope, intercept, r_value, p_value, std_err = linregress(x=southernlatitude, y=southerncloudiness)
print("slope: %f    intercept: %f" % (slope, intercept))
print("R-squared: %f" % (r_value ** 2))

In [None]:
# Plot the observations and the fitted line (slope, intercept and r_value come from the
# linregress call). The labels give plt.legend() entries to display.
plt.plot(southernlatitude, southerncloudiness, 'o', label="Cities")
plt.plot(southernlatitude, intercept + slope*southernlatitude, 'r', label="Linear fit")
plt.title("Southern Hemisphere: Latitude vs Cloudiness")
plt.xlabel("Latitude")
plt.ylabel("Cloudiness")
plt.legend()
print("R-squared: %f" % r_value**2)
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
# Place the equation in axes-fraction coordinates: the data point (10, 30) has a positive
# latitude, which is outside the range of the southern-hemisphere x axis.
plt.annotate(line_eq, xy=(0.05, 0.05), xycoords="axes fraction", fontsize=15, color="red")

# Save before show(): after show() the figure is typically closed, so a later savefig
# would write an empty image.
plt.savefig("figure9.png")
plt.show()

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

In [None]:
# Northern-hemisphere regression inputs: latitude (x) and wind speed (y).
northernlatitude, northernwindspeed = (northernhemi[col] for col in ("Lat", "Wind Speed"))

# Linear regression of wind speed on latitude; report the line and its R-squared.
slope, intercept, r_value, p_value, std_err = linregress(x=northernlatitude, y=northernwindspeed)
print("slope: %f    intercept: %f" % (slope, intercept))
print("R-squared: %f" % (r_value ** 2))

In [None]:
# Plot the observations and the fitted line (slope, intercept and r_value come from the
# linregress call). The labels give plt.legend() entries to display.
plt.plot(northernlatitude, northernwindspeed, 'o', label="Cities")
plt.plot(northernlatitude, intercept + slope*northernlatitude, 'r', label="Linear fit")
plt.title("Northern Hemisphere: Latitude vs Wind Speed")
plt.xlabel("Latitude")
plt.ylabel("Wind Speed")
plt.legend()
print("R-squared: %f" % r_value**2)
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
# Place the equation in axes-fraction coordinates so it stays inside the plot whatever
# the data range is (the data point (10, 30) is above the axis when no wind speed
# reaches 30).
plt.annotate(line_eq, xy=(0.05, 0.9), xycoords="axes fraction", fontsize=15, color="red")

# Save before show(): after show() the figure is typically closed, so a later savefig
# would write an empty image.
plt.savefig("figure10.png")
plt.show()

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

In [None]:
# Southern-hemisphere regression inputs: latitude (x) and wind speed (y).
southernlatitude, southernwindspeed = (southernhemi[col] for col in ("Lat", "Wind Speed"))

# Linear regression of wind speed on latitude; report the line and its R-squared.
slope, intercept, r_value, p_value, std_err = linregress(x=southernlatitude, y=southernwindspeed)
print("slope: %f    intercept: %f" % (slope, intercept))
print("R-squared: %f" % (r_value ** 2))

In [None]:
# Plot the observations and the fitted line (slope, intercept and r_value come from the
# linregress call). The labels give plt.legend() entries to display.
plt.plot(southernlatitude, southernwindspeed, 'o', label="Cities")
plt.plot(southernlatitude, intercept + slope*southernlatitude, 'r', label="Linear fit")
# Title fixed: the original read "SouthernHemisphere" (missing space).
plt.title("Southern Hemisphere: Latitude vs Wind Speed")
plt.xlabel("Latitude")
plt.ylabel("Wind Speed")
plt.legend()
print("R-squared: %f" % r_value**2)
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
# Place the equation in axes-fraction coordinates: the data point (10, 30) has a positive
# latitude, which is outside the range of the southern-hemisphere x axis.
plt.annotate(line_eq, xy=(0.05, 0.9), xycoords="axes fraction", fontsize=15, color="red")

# Save before show(): after show() the figure is typically closed, so a later savefig
# would write an empty image.
plt.savefig("figure11.png")
plt.show()