# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [18]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
from scipy.stats import linregress

# Import API key
from api_keys import weather_api_key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Destination CSV path for the collected city weather data
output_data_file = "output_data/cities.csv"

# Coordinate bounds as (min, max) pairs used when sampling random locations
lat_range, lng_range = (-90, 90), (-180, 180)

## Generate Cities List

In [21]:
# Unique city names in first-seen order; the companion set gives O(1)
# duplicate checks instead of rescanning the list for every candidate.
cities = []
seen_cities = set()

# Number of random coordinate pairs to draw.
# Kept small (20) for quick test runs; use 1500 for the full-size sample.
sample_size = 20

# Create a set of random lat and lng combinations within the configured ranges
lats = np.random.uniform(lat_range[0], lat_range[1], size=sample_size)
lngs = np.random.uniform(lng_range[0], lng_range[1], size=sample_size)
lat_lngs = zip(lats, lngs)

# Identify nearest city for each lat, lng combination
for rand_lat, rand_lng in lat_lngs:
    city = citipy.nearest_city(rand_lat, rand_lng).city_name

    # If the city is unique, then add it to our cities list
    if city not in seen_cities:
        seen_cities.add(city)
        cities.append(city)

# Print the city count to confirm sufficient count.
# (A bare `len(cities)` in the middle of a cell is silently discarded,
# so the count has to be printed explicitly.)
print(f"City count: {len(cities)}")
print(cities)

['grindavik', 'mahajanga', 'saldanha', 'rikitea', 'saskylakh', 'ushuaia', 'west bay', 'punta arenas', 'huarmey', 'tahta', 'jamestown', 'ketchikan', 'harper', 'barentsburg', 'belushya guba', 'shubarkuduk', 'kodiak', 'bluff']


### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it's being processed (with the city number and city name).


In [22]:
# Query prefix: imperial units, API key, and a trailing "&q=" so the city
# name can simply be appended.
# NOTE(review): the key is sent over plain http here — confirm whether the
# endpoint should be called via https instead.
base_url = "http://api.openweathermap.org/data/2.5/weather?units=imperial&appid=" + weather_api_key + "&q="

print("Beginning Data Retrieval")
print("--------------------------------")

# Parallel lists filled by the loop below: position i in every list
# describes the same successfully retrieved city.
temperature = []
humidity = []
cloudiness = []
wind = []
lat = []
good_city = []

cityCount = 0
# Query each city in turn and collect the fields needed for the analysis
for city in cities:
    cityCount += 1
    print(f"Processing Record {cityCount} | {city}")
    try:
        # A timeout keeps one unresponsive request from stalling the whole run
        weather_response = requests.get(base_url + city, timeout=10)
        weather_json = weather_response.json()

        # Read every field BEFORE appending anything: if any key is missing
        # the city is skipped as a whole and the lists stay the same length.
        city_lat = weather_json["coord"]["lat"]
        city_temp = weather_json["main"]["temp"]
        city_humidity = weather_json["main"]["humidity"]
        city_cloudiness = weather_json["clouds"]["all"]
        city_wind = weather_json["wind"]["speed"]
    except (KeyError, TypeError, ValueError, requests.exceptions.RequestException):
        # KeyError/TypeError: response lacks the expected fields
        # ValueError: response body is not valid JSON
        # RequestException: connection problem or timeout
        # (A bare `except:` would also swallow KeyboardInterrupt.)
        print("City not found.  Skipping...")
        continue

    lat.append(city_lat)
    temperature.append(city_temp)
    humidity.append(city_humidity)
    cloudiness.append(city_cloudiness)
    wind.append(city_wind)
    good_city.append(city)
 

Beginning Data Retrieval
--------------------------------
Processing Record 1 | grindavik
Processing Record 2 | mahajanga
Processing Record 3 | saldanha
Processing Record 4 | rikitea
Processing Record 5 | saskylakh
Processing Record 6 | ushuaia
Processing Record 7 | west bay
Processing Record 8 | punta arenas
Processing Record 9 | huarmey
Processing Record 10 | tahta
Processing Record 11 | jamestown
Processing Record 12 | ketchikan
Processing Record 13 | harper
Processing Record 14 | barentsburg
City not found.  Skipping...
Processing Record 15 | belushya guba
City not found.  Skipping...
Processing Record 16 | shubarkuduk
Processing Record 17 | kodiak
Processing Record 18 | bluff


### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

In [26]:
# Create the dictionary from the individual lists.
# Each list holds one entry per successfully retrieved city, in the same order.
city_dict = {
    "city": good_city,
    "lat": lat,
    "temp": temperature,
    "humidity": humidity,
    "cloudiness": cloudiness,
    "windspeed": wind
}

# Convert dictionary to dataframe.
# (Previously referenced an undefined name `weather_dict`, which raises
# NameError on a fresh kernel; the dictionary built above is `city_dict`.)
city_data = pd.DataFrame(city_dict)

# Save the dataframe as a csv.
city_data.to_csv(output_data_file)

# Display the first five rows of the dataframe
city_data.head()

Unnamed: 0,city,lat,temp,humidity,cloudiness,windspeed
0,grindavik,63.84,23.0,57,0,3.36
1,mahajanga,-15.72,77.0,100,20,2.24
2,saldanha,-33.01,59.0,67,0,5.82
3,rikitea,-23.12,77.68,72,4,10.49
4,saskylakh,71.92,-1.46,91,100,10.47


## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [31]:
# Keep only the rows whose humidity reading is at most 100; higher values are dropped
clean_city_data = city_data.loc[city_data["humidity"].le(100)]

In [32]:
# Preview the leading five rows of the filtered data
clean_city_data.head(5)


Unnamed: 0,city,lat,temp,humidity,cloudiness,windspeed
0,grindavik,63.84,23.0,57,0,3.36
1,mahajanga,-15.72,77.0,100,20,2.24
2,saldanha,-33.01,59.0,67,0,5.82
3,rikitea,-23.12,77.68,72,4,10.49
4,saskylakh,71.92,-1.46,91,100,10.47


## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

## Latitude vs. Humidity Plot

## Latitude vs. Cloudiness Plot

## Latitude vs. Wind Speed Plot

## Linear Regression

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression