# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [1]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
import json
from scipy import stats
from scipy.stats import linregress
import pprint as pprint

# Import API key
from api_keys import weather_api_key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Output File (CSV)
output_data_file = "output_data/cities.csv"

# Range of latitudes and longitudes
lat_range = (-90, 90)
lng_range = (-180, 180)


In [2]:
# List for holding lat_lngs and cities
lat_lngs = []
cities = []

# Create a set of random lat and lng combinations
lats = np.random.uniform(lat_range[0], lat_range[1], size=1500)
lngs = np.random.uniform(lng_range[0], lng_range[1], size=1500)
lat_lngs = zip(lats, lngs)

# Identify nearest city for each lat, lng combination
for lat_lng in lat_lngs:
    city = citipy.nearest_city(lat_lng[0], lat_lng[1]).city_name
    
    # If the city is unique, then add it to a our cities list
    if city not in cities:
        cities.append(city)

# Print the city count to confirm sufficient count
len(cities)

629

## Generate Cities List

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it'sbeing processed (with the city number and city name).


In [3]:
# Save config information.
base = "http://api.openweathermap.org/data/2.5/weather?" 
units = "metric"

# Build partial query URL

url = f'{base}appid={weather_api_key}&units={units}&q='
response = requests.get(url + city)
weather = response.json()
print(json.dumps(weather, indent =4))

{
    "cod": 429,
    "message": "Your account is temporary blocked due to exceeding of requests limitation of your subscription type. Please choose the proper subscription http://openweathermap.org/price"
}


### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

In [4]:
#create a City dataframe
citydf = pd.DataFrame({'City': cities})
citydf

Unnamed: 0,City
0,tumannyy
1,jamestown
2,arica
3,thompson
4,kapaa
...,...
624,batken
625,san cristobal
626,payo
627,naumburg


In [5]:
#citydf["Country"] = ""
#citydf["Latitude"] = ""
#citydf["Longitude"] = ""
#citydf["Temperature (F)"] = ""
#citydf["Humidity"] = ""
#citydf["Cloudiness"] = ""
#citydf["Wind Speed (mph)"] = ""
place =[]
country = []
latitude = []
longitude = []
temperature = []
humidity = []
cloudiness=[]
wind_speed= []
city_data = []


In [6]:
# Save config information.
base = "http://api.openweathermap.org/data/2.5/weather?" 
units = "metric"


city_data = []

for city in cities:
    url = f'{base}appid={weather_api_key}&units={units}&q='
    print(f" Found this {city}")
    try:
        response = requests.get(url + city).json()
        country = response["sys"]["country"]
        latitude= response["coord"]["lat"]
        longitude =response["coord"]["lon"]
        temperature = response["main"]["temp"]
        humidity =response["main"]["humidity"]
        cloudiness= response["clouds"]["all"]
        wind_speed=response["wind"]["speed"]
        city_data.append({"City":city, "Country": country, 'Latitude':latitude, 
                          "Longitude": longitude, "Temperature": temperature, "Humidity": humidity,
                         "Cloudiness": cloudiness, "Windspeed": wind_speed})

    except:
        print("Country not found")




 Found this tumannyy
Country not found
 Found this jamestown
Country not found
 Found this arica
Country not found
 Found this thompson
Country not found
 Found this kapaa
Country not found
 Found this banda aceh
Country not found
 Found this busselton
Country not found
 Found this saint george
Country not found
 Found this guerrero negro
Country not found
 Found this atherton
Country not found
 Found this rikitea
Country not found
 Found this ushuaia
Country not found
 Found this pleasanton
Country not found
 Found this tabiauea
Country not found
 Found this tasiilaq
Country not found
 Found this avarua
Country not found
 Found this tautira
Country not found
 Found this roura
Country not found
 Found this albany
Country not found
 Found this hilo
Country not found
 Found this barrow
Country not found
 Found this hithadhoo
Country not found
 Found this chapais
Country not found
 Found this bredasdorp
Country not found
 Found this aflu
Country not found
 Found this atuona
Country not fo

In [7]:
weatherdf =pd.DataFrame(city_data)
weatherdf["Temperature"] = round(1.8 * weatherdf['Temperature'] + 32,2)
weatherdf

KeyError: 'Temperature'

## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [None]:
#no cities over 100% humidity
overhum = dataframe[dataframe["Humidity"]>100]
overhum

In [None]:
#  Get the indices of cities that have humidity over 100%.
#N/A

In [None]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


In [None]:
#N/A

## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

In [8]:
#scatterplot Temp vs Latitude

plt.scatter(weatherdf["Latitude"], weatherdf["Temperature"], facecolors = 'blue', marker = 'o')

plt.title("City Latitude vs Temperature (F)")
plt.xlabel("City Latitude")
plt.ylabel("City Temperature (F)")

plt.show()
#Observation: The closer the city is to the equator, the higher the temperature. 
#Also, the northern hemisphere cities are getting colder than the southern hemispherer cities.
#Factors to consider:  Winter vs Summer in the hemispheres.

KeyError: 'Latitude'

## Latitude vs. Humidity Plot

In [None]:
plt.scatter(weatherdf["Latitude"], weatherdf["Humidity"], facecolors = 'blue', marker = 'o')

plt.title("Latitude vs Humidity %")
plt.xlabel("City Latitude")
plt.ylabel("City Humidity %")

plt.show()
#Observation: The cities closest to the equator does not necessarily mean the humidity percentage is higher.  
#If fact, some cities closer to the equator are less humidity right now than other cities. 
#Factors to consider:  Winter vs Summer in the hemispheres.

## Latitude vs. Cloudiness Plot

In [None]:
plt.scatter(weatherdf["Latitude"], weatherdf["Cloudiness"], facecolors = 'blue', marker = 'o')

plt.title("Latitude vs Cloudiness %")
plt.xlabel("City Latitude")
plt.ylabel("Cloudiness %")

plt.show()
#Observations: Cities tend to have more 0% cloudiness or 100% than anything in between no matter the city's latitude.

## Latitude vs. Wind Speed Plot

In [None]:
plt.scatter(weatherdf["Latitude"], weatherdf["Windspeed"], facecolors = 'blue', marker = 'o')

plt.title("Latitude vs Wind Speed (mph)")
plt.xlabel("City Latitude")
plt.ylabel("Wind Speed (mph)")

plt.show()
#Observations: The city's latitude does not have a high correlation with the wind speed in that city. Most city's wind blows at about 5mph or lower each day.

## Linear Regression

In [None]:
#dataframe for just North Hemisphere
northtemp = dataframe[dataframe["Latitude"]>0]


####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

In [None]:
#define the axis
x_values = northtemp['Latitude']
y_values = northtemp['Temperature']

# Perform a linear regression on temperature vs. latitude
(slope, intercept, rvalue, pvalue, stderr) = stats.linregress(x_values, y_values)

#define regression values
regress_values = x_values * slope + intercept
#print(regress_values)
line_eq = "y = " + str(round(slope,2)) + "x +" + str(round(intercept,2))
print(line_eq)
stats.linregress(x_values, y_values)

In [None]:
plt.plot(x_values,regress_values,"r-")

# Label plot and annotate the line equation
plt.title("North Hemisphere: City Latitude vs Temperature (F)")
plt.xlabel(' City Latitude')
plt.ylabel('City Temperature (F)')
plt.annotate(line_eq,(20,15),fontsize=16,color="blue")

# Print r value by squaring it
print(f"The r value is: {rvalue**2}")

# Show plot
plt.show()

In [None]:
plt.scatter(x_values, y_values, facecolors = 'blue', marker = 'o')
plt.title("North Hemisphere: City Latitude vs Temperature (F)")
plt.xlabel("City Latitude")
plt.ylabel("City Temperature (F)")

plt.show()
#Observations: The further away from the equator, the clolder the temperature. (drops in a linear way) 

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

In [None]:
#define souhern hemisphere dataframe
southtemp = dataframe[dataframe["Latitude"]<0]
southtemp 

In [None]:
#define the axis
x_values = southtemp['Latitude']
y_values = southtemp['Temperature']

# Perform a linear regression on temperature vs. latitude
(slope, intercept, rvalue, pvalue, stderr) = stats.linregress(x_values, y_values)

#define regression values
regress_values = x_values * slope + intercept
#print(regress_values)
line_eq = "y = " + str(round(slope,2)) + "x +" + str(round(intercept,2))
print(line_eq)
stats.linregress(x_values, y_values)

In [None]:
plt.plot(x_values,regress_values,"r-")

# Label plot and annotate the line equation
plt.title("North Hemisphere: City Latitude vs Temperature (F)")
plt.xlabel(' City Latitude')
plt.ylabel('City Temperature (F)')
plt.annotate(line_eq,(20,15),fontsize=16,color="blue")

# Print r value by squaring it
print(f"The r value is: {rvalue**2}")

# Show plot
plt.show()

In [None]:
#scatterplot southern hemisphere latitude vs temperature
plt.scatter(southtemp["Latitude"], southtemp["Temperature"], facecolors = 'blue', marker = 'o')
plt.title("South Hemisphere: City Latitude vs Temperature (F)")
plt.xlabel("City Latitude")
plt.ylabel("City Temperature (F)")

plt.show()
#Observations: The cities in the souther hemisphere show an decrease in temperature as they get further from the equator.
#The correlation isn't as strong as the northern hemisphere. 

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

In [None]:
plt.scatter(northtemp["Latitude"], northtemp["Humidity"], facecolors = 'blue', marker = 'o')

plt.title("North Hemisphere: City Latitude vs Humdity (%)")
plt.xlabel("City Latitude")
plt.ylabel("City Humdity (%)")

plt.show()
#Observations: The further away from the equator, the clolder the temperature. (drops in a linear way)

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

In [None]:
plt.scatter(southtemp["Latitude"], southtemp["Humidity"], facecolors = 'blue', marker = 'o')

plt.title("South Hemisphere: City Latitude vs Humidity (%)")
plt.xlabel("City Latitude")
plt.ylabel("City Humidity (%)")

plt.show()

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

In [None]:
plt.scatter(northtemp["Latitude"], northtemp["Cloudiness"], facecolors = 'blue', marker = 'o')

plt.title("North Hemisphere: City Latitude vs Cloudiness %")
plt.xlabel("City Latitude")
plt.ylabel("City Cloudiness %")
plt.show()

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

In [None]:
plt.scatter(southtemp["Latitude"], southtemp["Humidity"], facecolors = 'blue', marker = 'o')

plt.title("South Hemisphere: City Latitude vs Cloudiness %")
plt.xlabel("City Latitude")
plt.ylabel("City Cloudiness %")

plt.show()

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

In [None]:
plt.scatter(northtemp["Latitude"], northtemp["Windspeed"], facecolors = 'blue', marker = 'o')

plt.title("North Hemisphere: City Latitude vs Windspeed (mph)")
plt.xlabel("City Latitude")
plt.ylabel("City Windspeed (mph)")
plt.show()

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

In [None]:
plt.scatter(southtemp["Latitude"], southtemp["Windspeed"], facecolors = 'blue', marker = 'o')

plt.title("South Hemisphere: City Latitude vs Windspeed (mph)")
plt.xlabel("City Latitude")
plt.ylabel("City Windspeed (mph)")

plt.show()