# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [2]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
import seaborn as sns
from scipy.stats import linregress

# Import API key
from api_keys import weather_api_key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Output File (CSV)
original_output_df = "output_data/cities.csv"

# Range of latitudes and longitudes
lat_range = (-90, 90)
lng_range = (-180, 180)

## Generate Cities List

In [3]:
# List for holding lat_lngs and cities
lat_lngs = []
cities = []


# Create a set of random lat and lng combinations
lats = np.random.uniform(lat_range[0], lat_range[1], size=1500)
lngs = np.random.uniform(lng_range[0], lng_range[1], size=1500)
lat_lngs = zip(lats, lngs)

# Identify nearest city for each lat, lng combination
for lat_lng in lat_lngs:
    city = citipy.nearest_city(lat_lng[0], lat_lng[1]).city_name
    
    # If the city is unique, then add it to a our cities list
    if city not in cities:
        cities.append(city)

# Print the city count to confirm sufficient count
len(cities)

589

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it'sbeing processed (with the city number and city name).


In [4]:
# WEATHER_API URL: http://api.openweathermap.org/data/2.5/weather?appid=fc77fb30aacf15de2e57f6ad2f7b9786&units=metric&q=
url = "http://api.openweathermap.org/data/2.5/weather?"
units = "metric"


#Lists for holding weather data
temp = []
humidity = []
max_temp = []
cloudiness = []
windspeed = []
country = []
date = []
city2 = []

#Lat (y) | Long (x) 
lat = []
lng = []

#for loop numbers for Record number and Set numbers
number = 1 
set_num = 1

#Loop through cities for weather data
for city in cities[:500]:
    weather_url = f"{url}appid={weather_api_key}&units={units}&q=" + city
    weather_response = requests.get(weather_url)
    weather_json = weather_response.json()

    try:
        temp.append(weather_json['main']['temp'])
        humidity.append(weather_json['main']['humidity'])
        max_temp.append(weather_json['main']['temp_max'])
        cloudiness.append(weather_json['clouds']['all'])
        windspeed.append(weather_json['wind']['speed'])
        country.append(weather_json['sys']['country'])
        date.append(weather_json['dt'])
        lat.append(weather_json['coord']['lat'])
        lng.append(weather_json['coord']['lon'])
        city2.append(city)

            

        print(f"Processing Record {number} of Set of {set_num} | {city}")
        number = number + 1
        if number > 50:
            number = 0 
            set_num = set_num + 1 
            
    except:
        print("City not found. Skipping...")

Processing Record 1 of Set of 1 | te anau
Processing Record 2 of Set of 1 | tuktoyaktuk
Processing Record 3 of Set of 1 | santa isabel do rio negro
Processing Record 4 of Set of 1 | port hardy
Processing Record 5 of Set of 1 | barrow
Processing Record 6 of Set of 1 | hayden
Processing Record 7 of Set of 1 | cape town
Processing Record 8 of Set of 1 | lagoa
Processing Record 9 of Set of 1 | mount gambier
City not found. Skipping...
Processing Record 10 of Set of 1 | atuona
Processing Record 11 of Set of 1 | nyurba
Processing Record 12 of Set of 1 | port lincoln
Processing Record 13 of Set of 1 | longyearbyen
Processing Record 14 of Set of 1 | vaini
Processing Record 15 of Set of 1 | ostrovnoy
City not found. Skipping...
Processing Record 16 of Set of 1 | ushuaia
Processing Record 17 of Set of 1 | hamilton
Processing Record 18 of Set of 1 | kontagora
Processing Record 19 of Set of 1 | lebu
Processing Record 20 of Set of 1 | palu
Processing Record 21 of Set of 1 | hilo
Processing Record 2

Processing Record 23 of Set of 4 | gat
Processing Record 24 of Set of 4 | shimanovsk
City not found. Skipping...
Processing Record 25 of Set of 4 | saravan
City not found. Skipping...
Processing Record 26 of Set of 4 | santiago del estero
Processing Record 27 of Set of 4 | college
Processing Record 28 of Set of 4 | gazanjyk
Processing Record 29 of Set of 4 | strezhevoy
Processing Record 30 of Set of 4 | gornopravdinsk
Processing Record 31 of Set of 4 | karlskrona
Processing Record 32 of Set of 4 | tabou
Processing Record 33 of Set of 4 | vanavara
Processing Record 34 of Set of 4 | sao joao da barra
Processing Record 35 of Set of 4 | bengkulu
Processing Record 36 of Set of 4 | saint george
Processing Record 37 of Set of 4 | margate
Processing Record 38 of Set of 4 | fukue
Processing Record 39 of Set of 4 | axim
Processing Record 40 of Set of 4 | altay
Processing Record 41 of Set of 4 | sitka
City not found. Skipping...
City not found. Skipping...
Processing Record 42 of Set of 4 | loren

Processing Record 44 of Set of 7 | paita
Processing Record 45 of Set of 7 | mudanjiang
City not found. Skipping...
Processing Record 46 of Set of 7 | boueni
Processing Record 47 of Set of 7 | sabanalarga
Processing Record 48 of Set of 7 | lyngseidet
Processing Record 49 of Set of 7 | puerto princesa
Processing Record 50 of Set of 7 | toamasina
Processing Record 0 of Set of 8 | sorland
Processing Record 1 of Set of 8 | hirara
Processing Record 2 of Set of 8 | banda aceh
Processing Record 3 of Set of 8 | antofagasta
Processing Record 4 of Set of 8 | leh
Processing Record 5 of Set of 8 | vangaindrano
Processing Record 6 of Set of 8 | paramirim
Processing Record 7 of Set of 8 | beringovskiy
Processing Record 8 of Set of 8 | tutoia
Processing Record 9 of Set of 8 | souillac
Processing Record 10 of Set of 8 | mount isa
Processing Record 11 of Set of 8 | avera
Processing Record 12 of Set of 8 | sadao
Processing Record 13 of Set of 8 | fez
Processing Record 14 of Set of 8 | paamiut
Processing 

### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

In [7]:
# create dataframe
weather_dict = {"City": city2,
                "Lat": lat,
                "Lng": lng,
                "Max Temp": max_temp,
                "Humidity": humidity,
                "Cloudiness": cloudiness,
                "Windspeed": windspeed,
                "Country": country,
                "Date": date,
                }
weather_data = pd.DataFrame(weather_dict)
weather_data.to_csv(original_output_df)
weather_data

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Windspeed,Country,Date
0,te anau,-45.4167,167.7167,5.23,94,61,1.58,NZ,1628623362
1,tuktoyaktuk,69.4541,-133.0374,11.00,66,75,5.14,CA,1628623362
2,santa isabel do rio negro,-0.4139,-65.0192,33.44,44,29,2.67,BR,1628623363
3,port hardy,50.6996,-127.4199,18.10,77,75,3.60,CA,1628623363
4,barrow,71.2906,-156.7887,3.01,89,90,4.12,US,1628623363
...,...,...,...,...,...,...,...,...,...
455,cananeia,-25.0147,-47.9267,27.91,48,100,1.43,BR,1628623509
456,progreso,21.2833,-89.6667,33.06,61,0,7.94,MX,1628623509
457,severnyy,50.6770,36.5532,23.02,46,75,3.00,RU,1628623510
458,kirakira,-10.4544,161.9205,25.58,87,24,5.33,SB,1628623510


In [None]:
weather_data.describe()

In [None]:
#  Get the indices of cities that have humidity over 100%.


In [None]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

In [None]:
plt.scatter(weather_data["Lat"], 
            weather_data["Max Temp"],
            edgecolor="blue", linewidths=1, marker="o", 
            alpha=0.8, label="Cities")

# Incorporate the other graph properties
plt.title("City Latitude vs. Max Temperature (%s)" % time.strftime("%x"))
plt.ylabel("Max Temperature (F)")
plt.xlabel("Latitude")
plt.grid(True)
sns.set()

# Save the figure
plt.savefig("Latitude vs Temperature (F).png")

## Latitude vs. Humidity Plot

In [None]:
plt.scatter(weather_data["Lat"], 
            weather_data["Humidity"],
            edgecolor="green", linewidths=1, marker="o", 
            alpha=0.8, label="Cities")

# Incorporate the other graph properties
plt.title("City Latitude vs. Max Temperature (%s)" % time.strftime("%x"))
plt.ylabel("Max Temperature (F)")
plt.xlabel("Latitude")
plt.grid(True)
sns.set()

# Save the figure
plt.savefig("Latitude vs Temperature (F).png")

## Latitude vs. Cloudiness Plot

In [None]:
plt.scatter(weather_data["Lat"], 
            weather_data["Cloudiness"],
            edgecolor="purple", linewidths=1, marker="o", 
            alpha=0.8, label="Cities")

# Incorporate the other graph properties
plt.title("City Latitude vs. Max Temperature (%s)" % time.strftime("%x"))
plt.ylabel("Max Temperature (F)")
plt.xlabel("Latitude")
plt.grid(True)
sns.set()

# Save the figure
plt.savefig("Latitude vs Temperature (F).png")

## Latitude vs. Wind Speed Plot

In [None]:
plt.scatter(weather_data["Lat"], 
            weather_data["Windspeed"],
            edgecolor="blue", linewidths=1, marker="o", 
            alpha=0.8, label="Cities")

# Incorporate the other graph properties
plt.title("City Latitude vs. Max Temperature (%s)" % time.strftime("%x"))
plt.ylabel("Max Temperature (F)")
plt.xlabel("Latitude")
plt.grid(True)
sns.set()

# Save the figure
plt.savefig("Latitude vs Temperature (F).png")

## Linear Regression

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

In [None]:
#Cities on the Equator will be included in the Southern Hemisphere data. 
northern_lat = weather_data[weather_data['Lat'] > 0]
southern_lat = weather_data[weather_data['Lat'] <= 0]

In [None]:
x_values = northern_lat['Lat']
y_values = northern_lat['Max Temp']
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
plt.scatter(x_values,y_values)
plt.plot(x_values,regress_values,"r-")
plt.annotate(line_eq,(6,10),fontsize=15,color="red")
plt.xlabel('Latitude')
plt.ylabel('Max Temperature')
plt.show()
print(f"R-squared: {rvalue**2:.6f}")

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

In [None]:
x_values = southern_lat['Lat']
y_values = southern_lat['Max Temp']
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
plt.scatter(x_values,y_values)
plt.plot(x_values,regress_values,"r-")
plt.annotate(line_eq,(6,10),fontsize=15,color="red")
plt.xlabel('Latitude')
plt.ylabel('Max Temperature')
plt.show()
print(f"R-squared: {rvalue**2:.6f}")

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

In [None]:
x_values = northern_lat['Lat']
y_values = northern_lat['Humidity']
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
plt.scatter(x_values,y_values)
plt.plot(x_values,regress_values,"r-")
plt.annotate(line_eq,(6,10),fontsize=15,color="red")
plt.xlabel('Latitude')
plt.ylabel('Humidity')
plt.show()
print(f"R-squared: {rvalue**2:.6f}")

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

In [None]:
x_values = southern_lat['Lat']
y_values = southern_lat['Humidity']
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
plt.scatter(x_values,y_values)
plt.plot(x_values,regress_values,"r-")
plt.annotate(line_eq,(6,10),fontsize=15,color="red")
plt.xlabel('Latitude')
plt.ylabel('Humidity')
plt.show()
print(f"R-squared: {rvalue**2:.6f}")

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

In [None]:
x_values = northern_lat['Lat']
y_values = northern_lat['Cloudiness']
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
plt.scatter(x_values,y_values)
plt.plot(x_values,regress_values,"r-")
plt.annotate(line_eq,(6,10),fontsize=15,color="red")
plt.xlabel('Latitude')
plt.ylabel('Cloudiness')
plt.show()
print(f"R-squared: {rvalue**2:.6f}")

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

In [None]:
x_values = southern_lat['Lat']
y_values = southern_lat['Cloudiness']
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
plt.scatter(x_values,y_values)
plt.plot(x_values,regress_values,"r-")
plt.annotate(line_eq,(6,10),fontsize=15,color="red")
plt.xlabel('Latitude')
plt.ylabel('Cloudiness')
plt.show()
print(f"R-squared: {rvalue**2:.6f}")

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

In [None]:
x_values = northern_lat['Lat']
y_values = northern_lat['Windspeed']
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
plt.scatter(x_values,y_values)
plt.plot(x_values,regress_values,"r-")
plt.annotate(line_eq,(6,10),fontsize=15,color="red")
plt.xlabel('Latitude')
plt.ylabel('Wind Speed')
plt.show()
print(f"R-squared: {rvalue**2:.6f}")

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

In [None]:
x_values = southern_lat['Lat']
y_values = southern_lat['Windspeed']
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
plt.scatter(x_values,y_values)
plt.plot(x_values,regress_values,"r-")
plt.annotate(line_eq,(6,10),fontsize=15,color="red")
plt.xlabel('Latitude')
plt.ylabel('Windspeed')
plt.show()
print(f"R-squared: {rvalue**2:.6f}")