# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [None]:
# Dependencies and Setup
import datetime
import time

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import requests
from scipy.stats import linregress

# Import API key
from api_keys import weather_api_key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Destination CSV for the collected city data
output_data_file = "output_data/cities.csv"

# Sampling bounds as (min, max) pairs used when drawing random coordinates
lat_range = -90, 90
lng_range = -180, 180

## Generate Cities List

In [2]:
# Draw 1500 random latitudes and longitudes inside the configured bounds
lats = np.random.uniform(*lat_range, size=1500)
lngs = np.random.uniform(*lng_range, size=1500)
lat_lngs = zip(lats, lngs)

# Look up the nearest city for every coordinate pair. Dict keys keep only the
# first occurrence of each name and preserve the order in which they were found.
cities = list(dict.fromkeys(
    citipy.nearest_city(lat, lng).city_name for lat, lng in lat_lngs
))

# Display the number of unique cities to confirm the sample is large enough
len(cities)

636

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it's being processed (with the city number and city name).


In [None]:
# Results table: one row per candidate city produced by the citipy step
weather_df = pd.DataFrame({'City': cities})

# Blank placeholder columns, filled from the OpenWeatherMap responses below
weather_columns = [
    'Latitude',
    'Longitude',
    'Max Temperature (F)',
    'Humidity (%)',
    'Cloudiness (%)',
    'Wind Speed (mph)',
    'Country',
    'Date',
]
for column in weather_columns:
    weather_df[column] = ''

# Endpoint is loop-invariant, so define it once before any request is made
base_url = "http://api.openweathermap.org/data/2.5/weather"

# Throttling: the free OpenWeatherMap tier allows 60 calls/min, so the loop
# makes at most 50 calls and then waits out the rest of the minute
calls_per_set = 50
seconds_per_set = 60

city_count = 0      # cities whose weather information was fully retrieved
api_call_count = 1  # position of the current call within the current set
sets = 0            # number of completed call sets
t0 = time.time()    # start time of the current set

# Query the API once per city and fill in that city's row
for index, row in weather_df.iterrows():
    city_name = row['City']

    # Query by city name only: the Country column is still blank at this point,
    # so appending it would just add a dangling comma to the query.
    search_parameters = {
        "q": str(city_name),
        "units": "imperial",  # Fahrenheit / mph, matching the column labels
        "mode": "json",
        "APPID": weather_api_key
    }
    weather_response = requests.get(base_url, params=search_parameters).json()

    try:
        # Extract everything first so a missing key cannot leave a half-filled row
        record = {
            'Latitude': weather_response['coord']['lat'],
            'Longitude': weather_response['coord']['lon'],
            'Max Temperature (F)': weather_response['main']['temp_max'],
            'Humidity (%)': weather_response['main']['humidity'],
            'Cloudiness (%)': weather_response['clouds']['all'],
            'Wind Speed (mph)': weather_response['wind']['speed'],
            # A missing country code should not discard an otherwise valid city
            'Country': weather_response.get('sys', {}).get('country', np.nan),
            'Date': weather_response['dt'],
        }
    except KeyError:
        # Error payloads (e.g. unknown city) lack the weather fields
        weather_df.loc[index, weather_columns] = np.nan
        print("City not found. Skipping...")
    else:
        for column, value in record.items():
            weather_df.loc[index, column] = value

        # Print log for each successfully processed city
        print(f'Processing Record {api_call_count} of Set {sets} | {city_name}')
        city_count = city_count + 1

    api_call_count = api_call_count + 1
    if api_call_count > calls_per_set:
        api_call_count = 1  # restart numbering for the next set
        sets = sets + 1
        # Wait out the remainder of the minute; clamp at zero because
        # time.sleep raises ValueError on a negative duration when the set
        # itself took longer than a minute
        time.sleep(max(0, seconds_per_set - (time.time() - t0)))
        t0 = time.time()
print(f"Processing successfully completed. Retrieved weather information for {city_count} cities")

Processing Record 1 of Set 0 | rikitea
City not found. Skipping...
Processing Record 3 of Set 0 | kahului
Processing Record 4 of Set 0 | lahaina
Processing Record 5 of Set 0 | lompoc
Processing Record 6 of Set 0 | port moresby
City not found. Skipping...
Processing Record 8 of Set 0 | ushuaia
Processing Record 9 of Set 0 | albany
Processing Record 10 of Set 0 | busselton
Processing Record 11 of Set 0 | jamestown
City not found. Skipping...
City not found. Skipping...
Processing Record 14 of Set 0 | hermanus
Processing Record 15 of Set 0 | sioux lookout
City not found. Skipping...
Processing Record 17 of Set 0 | punta arenas
Processing Record 18 of Set 0 | podgorenskiy
Processing Record 19 of Set 0 | dikson
Processing Record 20 of Set 0 | codrington
City not found. Skipping...
Processing Record 22 of Set 0 | belmonte
Processing Record 23 of Set 0 | cidreira
Processing Record 24 of Set 0 | yellowknife
City not found. Skipping...
Processing Record 26 of Set 0 | iznoski
Processing Record 2

Processing Record 9 of Set 4 | sibolga
City not found. Skipping...
Processing Record 11 of Set 4 | honiara
Processing Record 12 of Set 4 | taman
Processing Record 13 of Set 4 | pisco
Processing Record 14 of Set 4 | valavanur
Processing Record 15 of Set 4 | asfi
Processing Record 16 of Set 4 | kodinsk
Processing Record 17 of Set 4 | svetlogorsk
Processing Record 18 of Set 4 | nemuro
Processing Record 19 of Set 4 | galbshtadt
Processing Record 20 of Set 4 | narsaq
Processing Record 21 of Set 4 | davila
Processing Record 22 of Set 4 | naryan-mar
Processing Record 23 of Set 4 | praia
Processing Record 24 of Set 4 | cherskiy
Processing Record 25 of Set 4 | uyo
Processing Record 26 of Set 4 | zhuhai
Processing Record 27 of Set 4 | vila velha
Processing Record 28 of Set 4 | amuntai
Processing Record 29 of Set 4 | longyearbyen
City not found. Skipping...
City not found. Skipping...
Processing Record 32 of Set 4 | labytnangi
Processing Record 33 of Set 4 | loandjili
Processing Record 34 of Set 

In [None]:
# Results table: one row per candidate city, with blank placeholder columns
weather_df = pd.DataFrame({"City": cities})

weather_df["Latitude"] = ""
weather_df["Longitude"] = ""
weather_df["Max Temp"] = ""
weather_df["Humidity"] = ""
weather_df["Cloudiness"] = ""
weather_df["Wind Speed"] = ""
weather_df["Country"] = ""
weather_df["Date"] = ""  # same name as the column written inside the loop

# Iterate through cities and retrieve data
print("Begining Data Retrieval")
print("--------------------------")

# Endpoint is loop-invariant; query parameters are passed separately so that
# requests handles URL encoding of city names
base_url = "http://api.openweathermap.org/data/2.5/weather"

# Throttling: the free OpenWeatherMap tier allows 60 calls/min, so the loop
# makes at most 50 calls and then waits out the rest of the minute
calls_per_set = 50
seconds_per_set = 60

# Counters for the weather loop
city_count = 0      # cities whose weather information was fully retrieved
api_call_count = 1  # position of the current call within the current set
sets = 0            # number of completed call sets
t0 = time.time()    # start time of the current set

for index, row in weather_df.iterrows():
    city = row["City"]

    query_params = {
        "q": city,
        # Request Fahrenheit / mph directly instead of converting from Kelvin
        # by hand, which also gives wind speed in mph rather than m/s
        "units": "imperial",
        "appid": weather_api_key,
    }
    weather_response = requests.get(base_url, params=query_params).json()

    try:
        # Extract everything first so a missing key cannot leave a half-filled row
        record = {
            "Country": weather_response["sys"]["country"],
            "Date": datetime.datetime.fromtimestamp(weather_response["dt"]),
            "Latitude": weather_response["coord"]["lat"],
            "Longitude": weather_response["coord"]["lon"],
            "Cloudiness": weather_response["clouds"]["all"],
            "Humidity": weather_response["main"]["humidity"],
            "Max Temp": weather_response["main"]["temp_max"],
            "Wind Speed": weather_response["wind"]["speed"],
        }
    except KeyError:
        # Only a missing field means "not found"; other errors should surface
        print(f"City not found...skipping {city}.")
    else:
        print(f"Processing Record {api_call_count} of Set {sets} | {city}.")
        for column, value in record.items():
            weather_df.loc[index, column] = value
        city_count = city_count + 1

    # Count every call, successful or not, so records and sets number correctly
    api_call_count = api_call_count + 1
    if api_call_count > calls_per_set:
        api_call_count = 1
        sets = sets + 1
        # Clamp at zero: time.sleep raises ValueError on a negative duration
        time.sleep(max(0, seconds_per_set - (time.time() - t0)))
        t0 = time.time()

print("--------------------------")
print("Data Retrieval Complete")
print("--------------------------")

### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [None]:
#  Get the indices of cities that have humidity over 100%.


In [None]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


In [None]:
# Extract relevant fields from the data frame


# Export the City_Data into a csv


## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

## Latitude vs. Humidity Plot

## Latitude vs. Cloudiness Plot

## Latitude vs. Wind Speed Plot

## Linear Regression

In [None]:
# OPTIONAL: Create a function to create Linear Regression plots

In [None]:
# Create Northern and Southern Hemisphere DataFrames

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression