# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [6]:
import json
import requests
from api_key import weather_api_key
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
from citipy import citipy
from scipy.stats import linregress
from sklearn import datasets

## Generate Cities List

In [10]:
latitude_range = (-80,80)
long_range = (-180, 180)
lat_lngs = []

cities = []

lat = np.random.uniform(latitude_range[0],latitude_range[1], size = 2000)
lng = np.random.uniform(long_range[0],long_range[1], size = 2000)
lat_lngs = zip(lat, lng)



for lat_lng in lat_lngs:
    location = citipy.nearest_city(lat_lng[0], lat_lng[1]).city_name
    #location = location.replace(" ", "%20")
    if location not in cities:
        cities.append(location)
len(cities)
print(cities)

['mildura', 'northampton', 'tuktoyaktuk', 'shingu', 'butaritari', 'luderitz', 'guerrero negro', 'torbay', 'mehamn', 'samalaeulu', 'busselton', 'punta arenas', 'waitati', 'hobart', 'port lincoln', 'utiroa', 'shaunavon', 'thompson', 'fairbanks', 'mar del plata', 'balkanabat', 'vaitupu', 'lompoc', 'ngunguru', 'nikolskoye', 'mataura', 'cape town', 'vila', 'suntar', 'meulaboh', 'andevoranto', 'aklavik', 'east london', 'marienburg', 'ribeira grande', 'itarema', 'larsnes', 'kearney', 'rikitea', 'rio grande', 'tara', 'taolanaro', 'bluff', 'karaton', 'hasaki', 'rock sound', 'mumford', 'longyearbyen', 'belaya gora', 'avarua', 'kati', 'new norfolk', 'illoqqortoormiut', 'vanavara', 'sentyabrskiy', 'pacific grove', 'castro', 'arraial do cabo', 'komsomolskiy', 'buta', 'carnarvon', 'fomboni', 'saldanha', 'chuy', 'san cristobal', 'atuona', 'zyryanskoye', 'hilo', 'belushya guba', 'lebu', 'bow island', 'chokurdakh', 'tabou', 'saskylakh', 'san felipe', 'kainantu', 'amambai', 'preeceville', 'puerto escond

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it'sbeing processed (with the city number and city name).


In [14]:


url = "http://api.openweathermap.org/data/2.5/weather?"
units = "metric"
query_url = f"{url}appid={weather_api_key}&units={units}&q="

 

longitude = []
latitude = []
temp_max = []
humidity = []
cloudiness = []
windspeed = []
country = []
date = []

record = 1

for city in cities:
    response = requests.get(query_url + city).json()
    longitude.append(response['coord']['lon'])
    latitude.append(response['coord']['lat'])
    temp_max.append(response['main']['temp_max'])
    humidity.append(response['main']['humidity'])
    cloudiness.append(response['clouds']['all'])
    windspeed.append(response['wind']['speed'])
    country.append(response['sys']['country'])
    date.append(response['dt'])
    print(f"Processing Record {record} of set 1 | {city}")
    
    record += 1





TypeError: can only concatenate str (not "tuple") to str

### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

In [4]:
weather_data_dict = {"City":cities, "Lat":latitude,
                           "Lng":longitude, "Max Temp":temp_max,
                            "Humidity":humidity,"Cloudiness":cloudiness, "Wind Speed":windspeed,
                            "Country":country, "Date":date}


weather_data = pd.DataFrame(weather_data_dict)

weather_data.describe()

               

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
count,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
mean,,,,,,,,,
std,,,,,,,,,
min,,,,,,,,,
25%,,,,,,,,,
50%,,,,,,,,,
75%,,,,,,,,,
max,,,,,,,,,


In [5]:
weather_data.to_csv('Output_csv/weather_data.csv')

FileNotFoundError: [Errno 2] No such file or directory: 'Output_csv/weather_data.csv'

## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [None]:
clean_city_data = weather_data.drop(weather_data[weather_data['Humidity'] > 100].index, inplace = True) 

In [None]:
#  Get the indices of cities that have humidity over 100%.


In [None]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

In [None]:
plt.scatter(clean_city_data['Latitude'], clean_city_data['Max Temp'], marker='o', s=10)
plt.title("City Latitude Vs. Max Temp")
plt.ylabel("Max Temp")
plt.xlabel("Latitude")
plt.savefig("Output_plots/Max_Temp_VS_Lat.png")

## Latitude vs. Humidity Plot

In [None]:
plt.scatter(clean_city_data['Latitude'], clean_city_data['Humidity'], marker='o', s=10)
plt.title("City Latitude Vs. Humidity")
plt.ylabel("Humidity")
plt.xlabel("Latitude")
plt.savefig("Output_plots/Max_Temp_VS_Lat.png")

## Latitude vs. Cloudiness Plot

In [None]:
plt.scatter(clean_city_data['Latitude'], clean_city_data['Cloudiness'], marker='o', s=10)
plt.title("City Latitude Vs. Cloudiness")
plt.ylabel("Cloudiness")
plt.xlabel("Latitude")
plt.savefig("Output_plots/Max_Temp_VS_Lat.png")

## Latitude vs. Wind Speed Plot

In [None]:
plt.scatter(clean_city_data['Latitude'], clean_city_data['Wind Speed'], marker='o', s=10)
plt.title("City Latitude Vs. Wind Speed")
plt.ylabel("Wind Speed")
plt.xlabel("Latitude")
plt.savefig("Output_plots/Max_Temp_VS_Lat.png")

## Linear Regression

In [None]:
North_data = clean_city_data.drop(clean_city_data[clean_city_data['Latitude'] > 0].index, inplace = True)
South_data = clean_city_data.drop(clean_city_data[clean_city_data['Latitude'] < 0].index, inplace = True)

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

In [None]:
x_values = North_data['Latitude']
y_values = North_data['Max Temp']
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
plt.scatter(x_values,y_values)
plt.plot(x_values,regress_values,"r-")
plt.annotate(line_eq,(0,50),fontsize=15,color="red")
plt.xlabel('Northern Latitude')
plt.ylabel('Max Temp')
print(f"The r-squared is: {rvalue**2}")
plt.show()

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

In [None]:
x_values = South_data['Latitude']
y_values = South_data['Max Temp']
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
plt.scatter(x_values,y_values)
plt.plot(x_values,regress_values,"r-")
plt.annotate(line_eq,(0,50),fontsize=15,color="red")
plt.xlabel('Southern Latitude')
plt.ylabel('Max Temp')
print(f"The r-squared is: {rvalue**2}")
plt.show()

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

In [None]:
x_values = North_data['Humidity']
y_values = North_data['Max Temp']
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
plt.scatter(x_values,y_values)
plt.plot(x_values,regress_values,"r-")
plt.annotate(line_eq,(0,50),fontsize=15,color="red")
plt.xlabel('Northern Latitude')
plt.ylabel('Max Temp')
print(f"The r-squared is: {rvalue**2}")
plt.show()

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

In [None]:
x_values = South_data['Latitude']
y_values = South_data['Humidity']
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
plt.scatter(x_values,y_values)
plt.plot(x_values,regress_values,"r-")
plt.annotate(line_eq,(0,50),fontsize=15,color="red")
plt.xlabel('Southern Latitude')
plt.ylabel('Humidity')
print(f"The r-squared is: {rvalue**2}")
plt.show()

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

In [None]:
x_values = North_data['Latitude']
y_values = North_data['Cloudiness']
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
plt.scatter(x_values,y_values)
plt.plot(x_values,regress_values,"r-")
plt.annotate(line_eq,(0,50),fontsize=15,color="red")
plt.xlabel('Northern Latitude')
plt.ylabel('Cloudiness')
print(f"The r-squared is: {rvalue**2}")
plt.show()

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

In [None]:
x_values = South_data['Latitude']
y_values = South_data['Cloudiness']
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
plt.scatter(x_values,y_values)
plt.plot(x_values,regress_values,"r-")
plt.annotate(line_eq,(0,50),fontsize=15,color="red")
plt.xlabel('Southern Latitude')
plt.ylabel('Cloudiness')
print(f"The r-squared is: {rvalue**2}")
plt.show()

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

In [None]:
x_values = North_data['Latitude']
y_values = North_data['Wind Speed']
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
plt.scatter(x_values,y_values)
plt.plot(x_values,regress_values,"r-")
plt.annotate(line_eq,(0,50),fontsize=15,color="red")
plt.xlabel('Northern Latitude')
plt.ylabel('Wind Speed')
print(f"The r-squared is: {rvalue**2}")
plt.show()

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

In [None]:
x_values = South_data['Latitude']
y_values = South_data['Wind Speed']
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
plt.scatter(x_values,y_values)
plt.plot(x_values,regress_values,"r-")
plt.annotate(line_eq,(0,50),fontsize=15,color="red")
plt.xlabel('Southern Latitude')
plt.ylabel('Wind Speed')
print(f"The r-squared is: {rvalue**2}")
plt.show()