# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [52]:
%matplotlib inline

In [53]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
import os
from scipy.stats import linregress

# Import API key
from api_keys import weather_api_key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Output File (CSV)
# NOTE(review): no visible cell reads this name; the export cell writes to a
# separate hard-coded path -- confirm which path is intended.
output_data_file = "../output_data/cities.csv"

# Range of latitudes and longitudes, used as the (low, high) bounds for the
# random coordinate sampling in the city-generation cell.
lat_range = (-90, 90)
lng_range = (-180, 180)

## Generate Cities List

In [54]:
# Placeholders for the coordinate pairs and the city names.
# lat_lngs is rebound to a zip of random coordinates in the next cell, and
# cities is filled there with the unique nearest-city names.
lat_lngs = []
cities = []

In [55]:
# Create a set of random lat and lng combinations
lats = np.random.uniform(lat_range[0], lat_range[1], size=1500)
lngs = np.random.uniform(lng_range[0], lng_range[1], size=1500)
lat_lngs = zip(lats, lngs)

# Identify the nearest city for each lat, lng combination and keep each city
# name once, in first-seen order.
# The list is rebuilt from scratch here (instead of appending to a list made
# in another cell) so re-running this cell never accumulates cities from a
# previous run. dict.fromkeys de-duplicates in linear time, replacing the
# repeated `city not in cities` scan over a growing list.
cities = list(dict.fromkeys(
    citipy.nearest_city(point_lat, point_lng).city_name
    for point_lat, point_lng in lat_lngs
))

# Print the city count to confirm sufficient count
len(cities)

44

In [56]:
#create initial dataframe to hold cities
#cities_df = pd.DataFrame(cities, columns = ['city_name'])

In [57]:
#add additional columns to dataframes
#cities_df['weather'] = ""
#cities_df.head()

### Perform API Calls

* Perform a weather check on each city using a series of successive API calls.

* Include a print log of each city as it's being processed (with the city number and city name).

In [58]:
# Save config information
# HTTPS is used so the API key carried in the query string is not sent over
# the network in clear text.
url = "https://api.openweathermap.org/data/2.5/weather?"
units = "imperial"

# Build partial query URL; it ends with "q=" so a city name can be appended.
query_url = f"{url}appid={weather_api_key}&units={units}&q="

In [59]:
# set up lists to hold response info
#temp cities for testing
#cities = ["Sheboygan", "Chicago", "Miami"]
#city_id = []

In [60]:
# Parallel lists that become the columns of the weather DataFrame. They are
# reset here so re-running this cell starts from empty lists.
city_name = []
lat = []
long = []
temp_imperial = []
humidity = []
cloudiness = []
wind_speed = []

print('Beginning City Data Retrieval')
print('------------------------------')
# Loop through the list of cities and perform a request for data on each.
# enumerate supplies the record number for both the success and skip paths,
# replacing the hand-maintained counter that was incremented in two places.
for counter, city in enumerate(cities, start=1):
    try:
        # Let requests build the query string so city names containing
        # spaces, '&' or '#' are URL-encoded. The timeout stops one stalled
        # connection from hanging the whole run.
        response = requests.get(
            url,
            params={'appid': weather_api_key, 'units': units, 'q': city},
            timeout=10,
        ).json()
        # Read every field BEFORE appending anything: if any key is missing
        # the whole city is skipped and the lists stay the same length.
        record = (
            response['name'],
            response['coord']['lat'],
            response['coord']['lon'],
            response['main']['temp'],
            response['main']['humidity'],
            response['clouds']['all'],
            response['wind']['speed'],
        )
    except (KeyError, IndexError):
        print(f"City data for record #{counter} of total #{len(cities)} results not found. Skipping...")
        continue
    except (requests.exceptions.RequestException, ValueError) as err:
        # Network failure or a body that is not valid JSON. Only the exception
        # class is printed because the full message can contain the request
        # URL, which includes the API key.
        print(f"Request for record #{counter} of total #{len(cities)} results failed ({type(err).__name__}). Skipping...")
        continue

    columns = (city_name, lat, long, temp_imperial, humidity, cloudiness, wind_speed)
    for column, value in zip(columns, record):
        column.append(value)
    #print result city
    print(f'Processing Record #{counter} of total #{len(cities)} results | {city}')

print('------------------------------')
print('End of City Data Retrieval')
print('------------------------------')

Beginning City Data Retrieval
------------------------------
Processing Record #1 of total #44 results | sarankhola
Processing Record #2 of total #44 results | bredasdorp
Processing Record #3 of total #44 results | jamestown
Processing Record #4 of total #44 results | port elizabeth
Processing Record #5 of total #44 results | sabzevar
Processing Record #6 of total #44 results | sao joao da barra
Processing Record #7 of total #44 results | victoria
Processing Record #8 of total #44 results | fairbanks
Processing Record #9 of total #44 results | mataura
Processing Record #10 of total #44 results | albany
Processing Record #11 of total #44 results | tura
Processing Record #12 of total #44 results | poyarkovo
Processing Record #13 of total #44 results | hearst
Processing Record #14 of total #44 results | ushuaia
City data for record #15 of total #44 results not found. Skipping...
Processing Record #16 of total #44 results | hobart
Processing Record #17 of total #44 results | brae
Processin

### Convert Raw Data to DataFrame

In [112]:
# Pair each column label with the list collected during retrieval, then build
# the frame in one step; column order follows the label order below.
column_labels = ['City', 'Latitude', 'Longitude', 'Temp',
                 'Humidity', 'Cloudiness', 'Wind Speed']
column_values = [city_name, lat, long, temp_imperial,
                 humidity, cloudiness, wind_speed]
city_data_df = pd.DataFrame(dict(zip(column_labels, column_values)))

* Export the city data into a .csv.

In [113]:
# Write the city weather table to CSV. The output folder is created first so
# the export does not fail when ../output_data does not exist yet.
# The row index is written as the first, unnamed column (unchanged behavior).
city_weather_csv = '../output_data/city_weather_data.csv'
os.makedirs(os.path.dirname(city_weather_csv), exist_ok=True)
city_data_df.to_csv(city_weather_csv)

* Display the DataFrame

In [114]:
# Show the first rows as a quick sanity check of the assembled table.
city_data_df.head()

Unnamed: 0,City,Latitude,Longitude,Temp,Humidity,Cloudiness,Wind Speed
0,Sarankhola,22.31,89.79,81.05,90,95,4.12
1,Bredasdorp,-34.53,20.04,48.2,76,0,5.82
2,Jamestown,42.1,-79.24,78.8,57,1,6.93
3,Port Elizabeth,-33.92,25.57,55.4,37,0,4.7
4,Sabzawār,36.21,57.68,78.58,31,0,15.39


## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [119]:
# Select the cities whose reported humidity exceeds 100%.
# The threshold is 100 (not 99) so a legitimate reading of exactly 100% is
# not treated as an outlier, matching the "humidity > 100%" instruction.
city_data_h_humid = city_data_df[city_data_df['Humidity'] > 100]
city_data_h_humid

Unnamed: 0,City,Latitude,Longitude,Temp,Humidity,Cloudiness,Wind Speed


In [None]:
#  Get the indices of cities that have humidity over 100%.


In [None]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


In [None]:
# Extract relevant fields from the data frame


# Export the City_Data into a csv


## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

## Latitude vs. Humidity Plot

## Latitude vs. Cloudiness Plot

## Latitude vs. Wind Speed Plot

## Linear Regression

In [None]:
# OPTIONAL: Create a function to create Linear Regression plots

In [None]:
# Create Northern and Southern Hemisphere DataFrames

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression