# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [1]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
from scipy.stats import linregress

# Import API key
from api_keys import weather_api_key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Output File (CSV)
output_data_file = "output_data/cities.csv"

# Range of latitudes and longitudes
lat_range = (-90, 90)
lng_range = (-180, 180)

## Generate Cities List

In [2]:
# List for holding lat_lngs and cities
lat_lngs = []
cities = []
nan=float('NaN')

# Create a set of random lat and lng combinations
lats = np.random.uniform(lat_range[0], lat_range[1], size=1500)
lngs = np.random.uniform(lng_range[0], lng_range[1], size=1500)
lat_lngs = zip(lats, lngs)

# Identify nearest city for each lat, lng combination
for lat_lng in lat_lngs:
    city = citipy.nearest_city(lat_lng[0], lat_lng[1]).city_name
    
    # If the city is unique, then add it to a our cities list
    if city not in cities:
        cities.append(city)

# Print the city count to confirm sufficient count
len(cities)

626

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it'sbeing processed (with the city number and city name).


In [3]:
# cities

In [10]:
# Create a dataframe from the cities, lat, and temp
weather_dict = ({
        "city": cities
})

# Add empty columns to fill
weather_dict["Lat"] = ""
weather_dict["Long"] = ""
weather_dict["Max Temp"] = ""
weather_dict["Humidity"] = ""
weather_dict["Cloudiness"] = ""
weather_dict["Wind Speed"] = ""


weather_data = pd.DataFrame(weather_dict)
clean = weather_data.replace('NULL', nan)
clean = clean.dropna()
weather_data.head()

Unnamed: 0,city,Lat,Long,Max Temp,Humidity,Cloudiness,Wind Speed
0,minab,,,,,,
1,tsihombe,,,,,,
2,kudahuvadhoo,,,,,,
3,san antonio,,,,,,
4,kapaa,,,,,,
...,...,...,...,...,...,...,...
621,khormuj,,,,,,
622,mehran,,,,,,
623,doha,,,,,,
624,kudat,,,,,,


In [9]:
# Create a params dict that will be updated with new city each iteration
params = {"key": weather_api_key}

url = "http://api.openweathermap.org/data/2.5/weather?&units=imperial"


# Loop through the weather_data and run a Lat/Long search for each city
for index, row in weather_data.iterrows():
    base_url = f"{url}&appid={weather_api_key}"
    my_city_url = base_url + '&q=' + city
#     print(my_city_url)

    city_name = row['city']
    
    # Make request
    city_lat_lng = requests.get(my_city_url, params=params)
    
    # Convert to json
    city_lat_lng = city_lat_lng.json()
#     city_lat_long

    try:
        weather_data.loc[index, "Lat"] = city_lat_lng['coor'][0]['lat']
        weather_data.loc[index, "Long"] = city_lat_lng['coor'][0]['lng']
        weather_data.loc[index, "Max Temp"] = city_lat_lng['main'][0]['temp']
        weather_data.loc[index, "Humidity"] = city_lat_lng['main'][0]['humidity']
        weather_data.loc[index, "Cloudiness"] = city_lat_lng['clouds'][0]['all']
        weather_data.loc[index, "Wind Speed"] = city_lat_lng['wind'][0]['speed']
        time.sleep(1)
    except (KeyError, ValueError):
        # Append null values
        print("Missing field...skipping.")

Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing fiel

Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing field...skipping.
Missing fiel

NameError: name 'response' is not defined

## Latitude vs. Temperature Plot

In [7]:
# Build a scatter plot for Temperature (F) vs. Latitude
plt.scatter(weather_data["lat"], weather_data["temp"], marker="o")

# Incorporate the other graph properties
plt.title("Temperature (F) vs. Latitude in World Cities")
plt.ylabel("Temperature (F)")
plt.xlabel("Latitude")
plt.grid(True)

KeyError: 'lat'

The "Temperature vs. Latitude in World Cities" scatter plot compares the temperature vs. the latitude of hundreds of cities around the world.

In [None]:
# Create a for loop for humidity and latitude
humidity = []
lat = []

for city in cities:
    my_city_url = base_url + '&q=' + city
#     print(my_city_url)
    response = requests.get(my_city_url).json()
    try:
        humidity.append(response['main']['humidity'])
        lat.append(response['coord']['lat'])
        time.sleep(1)
    except (KeyError, ValueError):
        # Append null values
        print("Missing field...skipping.")
    
# print(response)

In [None]:
# Create a dataframe from the cities, humidity, and lat
weather_dict = ({
        "city": cities,
        "lat": lat,
        "humidity": temp
})
weather_data = pd.DataFrame(weather_dict)
weather_data.head()

## Latitude vs. Humidity Plot

In [None]:
# Build a scatter plot for Humidity vs. Latitude
plt.scatter(weather_data["lat"], weather_data["humidity"], marker="o")

# Incorporate the other graph properties
plt.title("Humidity (%) vs Latitude in World Cities")
plt.ylabel("Humidity (%)")
plt.xlabel("Latitude")
plt.grid(True)

The "Humidity vs. Latitude in World Cities" scatter plot compares the humidity vs. the latitude of hundreds of cities around the world.

In [None]:
# Create a for loop for cloudiness and latitude
all = []
lat = []

for city in cities:
    my_city_url = base_url + '&q=' + city
#     print(my_city_url)

    response = requests.get(my_city_url).json()
    try:
        all.append(response['clouds']['all'])
        lat.append(response['coord']['lat'])
        time.sleep(1)
    except (KeyError, ValueError):
        # Append null values
        print("Missing field...skipping.")
    
print(response)

In [None]:
# Create a dataframe from the cities, humidity, and lat
weather_dict = ({
        "city": cities,
        "lat": lat,
        "clouds": all
})
weather_data = pd.DataFrame(weather_dict)
weather_data.head()

In [None]:
# Build a scatter plot for Cloudiness vs. Latitude
plt.scatter(weather_data["lat"], weather_data["clouds"], marker="o")

# Incorporate the other graph properties
plt.title("Cloudiness (%) vs Latitude in World Cities")
plt.ylabel("Cloudiness (%)")
plt.xlabel("Latitude")
plt.grid(True)

In [None]:
# Create a for loop for wind speed and latitude
speed = []
lat = []

for city in cities:
    my_city_url = base_url + '&q=' + city
#     print(my_city_url)
    
    response = requests.get(my_city_url).json()
    try:    
        speed.append(response['wind']['speed'])
        lat.append(response['coord']['lat'])
        time.sleep(1)
    except (KeyError, ValueError):
        # Append null values
        print("Missing field...skipping.")
    
print(response)

In [None]:
# Create a dataframe from the cities, wind speed, and lat
weather_dict = ({
        "city": cities,
        "lat": lat,
        "wind": speed
})
weather_data = pd.DataFrame(weather_dict)
weather_data.head()

In [None]:
# Build a scatter plot for Wind Speed (mph) (F) vs. Latitude
plt.scatter(weather_data["lat"], weather_data["wind"], marker="o")

# Incorporate the other graph properties
plt.title("Wind Speed (mph) vs Latitude in World Cities")
plt.ylabel("Wind Speed (mph)")
plt.xlabel("Latitude")
plt.grid(True)


### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [None]:
#  Get the indices of cities that have humidity over 100%.


In [None]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Cloudiness Plot

## Latitude vs. Wind Speed Plot

## Linear Regression

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression