# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [1]:
# Dependencies and Setup
import os
import time
from datetime import datetime

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import requests
import scipy.stats as st
from scipy.stats import linregress

# Import API key
import config_from_pydata_env

weather_api_key = config_from_pydata_env.weather_api_key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Relative path of the CSV output file
output_data_file = "output_data/cities.csv"

# (min, max) bounds handed to np.random.uniform when sampling coordinates
lat_range, lng_range = (-90, 90), (-180, 180)

## Generate Cities List

In [2]:
# Create a set of random lat and lng combinations.
# No seed is set in this cell, so each run samples different coordinates
# and therefore produces a different city list.
lats = np.random.uniform(lat_range[0], lat_range[1], size=1500)
lngs = np.random.uniform(lng_range[0], lng_range[1], size=1500)
lat_lngs = zip(lats, lngs)

# Identify the nearest city for each lat, lng combination and keep every city
# name only once. dict.fromkeys de-duplicates in first-seen order with a hash
# lookup per name, instead of re-scanning a growing list for every sample.
cities = list(dict.fromkeys(
    citipy.nearest_city(lat, lng).city_name for lat, lng in lat_lngs
))

# Print the city count to confirm sufficient count
len(cities)

622

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it's being processed (with the city number and city name).


In [3]:
# Base endpoint of the OpenWeatherMap current-weather API.
# HTTPS is used because the API key is part of the query string and would
# otherwise be transmitted in plain text.
url = "https://api.openweathermap.org/data/2.5/weather?"

# Unit system requested from the API ("imperial": Fahrenheit, miles/hour)
units = "imperial"

# Query prefix shared by every request; the city name is appended after "q="
query_url = f"{url}appid={weather_api_key}&units={units}&q="

In [4]:
# Parallel result lists: position i in every list belongs to cities[i].
# A failed lookup stores NaN in all of them, so the lists stay the same length
# as `cities` and the failed rows can be dropped once the DataFrame is built.
lat = []
temp = []
temp_max = []
humidity = []
wind_speed = []
lon = []
date = []
country = []
cloudiness = []

# Same lists, in the order the fields are extracted from each response below
result_lists = (lat, lon, temp, temp_max, humidity, wind_speed, date, country, cloudiness)

# loop through list of cities and request information
count = 0
set_number = 1  # deliberately not named `set`, which would shadow the builtin
for city in cities:
    count = count + 1
    # using sleep here to not reach api limit: pause after every 50 records
    if count == 51:
        count = 1
        set_number = set_number + 1
        time.sleep(5)
    print(f"Processing Record {count} of Set {set_number} | {city}")
    try:
        # The timeout keeps a single stalled connection from hanging the whole run
        response = requests.get(query_url + city, timeout=30).json()
        # Extract every field BEFORE appending anything: if a key is missing
        # part-way through, no list has been touched yet, so the lists cannot
        # end up with different lengths.
        record = (
            response['coord']['lat'],
            response['coord']['lon'],
            response['main']['temp'],
            response['main']['temp_max'],
            response['main']['humidity'],
            response['wind']['speed'],
            response['dt'],
            response['sys']['country'],
            response['clouds']['all'],
        )
    except (requests.exceptions.RequestException, ValueError, KeyError, TypeError):
        # Network failure, non-JSON body, or a payload without the expected
        # fields. A bare `except:` would also swallow KeyboardInterrupt and
        # make the loop impossible to stop.
        print("City not found. Skipping...")
        record = (np.nan,) * len(result_lists)
    for values, value in zip(result_lists, record):
        values.append(value)
print("Data Retrieval Complete")

Processing Record 1 of Set 1 | castro
Processing Record 2 of Set 1 | maragogi
Processing Record 3 of Set 1 | marzuq
Processing Record 4 of Set 1 | dikson
Processing Record 5 of Set 1 | georgetown
Processing Record 6 of Set 1 | busselton
Processing Record 7 of Set 1 | cape town
Processing Record 8 of Set 1 | kudahuvadhoo
Processing Record 9 of Set 1 | roma
Processing Record 10 of Set 1 | rikitea
Processing Record 11 of Set 1 | ponta do sol
Processing Record 12 of Set 1 | norman wells
Processing Record 13 of Set 1 | krasnoarmeyskiy
Processing Record 14 of Set 1 | amalfi
Processing Record 15 of Set 1 | east london
Processing Record 16 of Set 1 | cidreira
Processing Record 17 of Set 1 | hithadhoo
Processing Record 18 of Set 1 | ketchikan
Processing Record 19 of Set 1 | lebu
Processing Record 20 of Set 1 | ushuaia
Processing Record 21 of Set 1 | ukiah
Processing Record 22 of Set 1 | mataura
Processing Record 23 of Set 1 | qaanaaq
Processing Record 24 of Set 1 | ponta delgada
Processing Reco

Processing Record 43 of Set 4 | kahului
Processing Record 44 of Set 4 | katsuura
Processing Record 45 of Set 4 | melton
Processing Record 46 of Set 4 | ziway
Processing Record 47 of Set 4 | half moon bay
Processing Record 48 of Set 4 | balikpapan
Processing Record 49 of Set 4 | puerto colombia
Processing Record 50 of Set 4 | rungata
City not found. Skipping...
Processing Record 1 of Set 5 | tsihombe
City not found. Skipping...
Processing Record 2 of Set 5 | tocopilla
Processing Record 3 of Set 5 | okha
Processing Record 4 of Set 5 | san patricio
Processing Record 5 of Set 5 | barrow
Processing Record 6 of Set 5 | pascagoula
Processing Record 7 of Set 5 | yaan
Processing Record 8 of Set 5 | waddan
Processing Record 9 of Set 5 | luderitz
Processing Record 10 of Set 5 | mys shmidta
City not found. Skipping...
Processing Record 11 of Set 5 | jiroft
City not found. Skipping...
Processing Record 12 of Set 5 | port macquarie
Processing Record 13 of Set 5 | kalabo
Processing Record 14 of Set 5

Processing Record 32 of Set 8 | falkoping
City not found. Skipping...
Processing Record 33 of Set 8 | gimli
Processing Record 34 of Set 8 | fonte boa
Processing Record 35 of Set 8 | laguna
Processing Record 36 of Set 8 | victoria
Processing Record 37 of Set 8 | abu samrah
Processing Record 38 of Set 8 | fare
Processing Record 39 of Set 8 | sao felix do xingu
Processing Record 40 of Set 8 | fort nelson
Processing Record 41 of Set 8 | tecoanapa
Processing Record 42 of Set 8 | gondanglegi
Processing Record 43 of Set 8 | port blair
Processing Record 44 of Set 8 | okhotsk
Processing Record 45 of Set 8 | hovd
Processing Record 46 of Set 8 | nara
Processing Record 47 of Set 8 | galle
Processing Record 48 of Set 8 | nanortalik
Processing Record 49 of Set 8 | jalu
Processing Record 50 of Set 8 | artyk
City not found. Skipping...
Processing Record 1 of Set 9 | chipiona
Processing Record 2 of Set 9 | mrirt
City not found. Skipping...
Processing Record 3 of Set 9 | siocon
Processing Record 4 of Se

City not found. Skipping...
Processing Record 22 of Set 12 | angra
City not found. Skipping...
Processing Record 23 of Set 12 | el dorado
Processing Record 24 of Set 12 | kangaatsiaq
Processing Record 25 of Set 12 | palabuhanratu
City not found. Skipping...
Processing Record 26 of Set 12 | korla
Processing Record 27 of Set 12 | koboldo
City not found. Skipping...
Processing Record 28 of Set 12 | caxias
Processing Record 29 of Set 12 | aguai
Processing Record 30 of Set 12 | juybar
Processing Record 31 of Set 12 | cairns
Processing Record 32 of Set 12 | palmer
Processing Record 33 of Set 12 | uhlove
Processing Record 34 of Set 12 | staromaryevka
City not found. Skipping...
Processing Record 35 of Set 12 | gornopravdinsk
Processing Record 36 of Set 12 | magistralnyy
Processing Record 37 of Set 12 | yagodnoye
Processing Record 38 of Set 12 | hofn
Processing Record 39 of Set 12 | tobol
Processing Record 40 of Set 12 | lasa
Processing Record 41 of Set 12 | emmett
Processing Record 42 of Set 

In [5]:
# Number of latitude entries collected by the retrieval loop
# (expected to equal len(cities), since skipped cities are stored as NaN)
len(lat)

622

### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

In [6]:
# Column name -> collected values; all lists are index-aligned with `cities`
weather_columns = {
    "City": cities,
    "Lat": lat,
    "Lng": lon,
    "Max Temp": temp_max,
    "Humidity": humidity,
    "Cloudiness": cloudiness,
    "Wind Speed": wind_speed,
    "Country": country,
    "Date": date,
}

# Build the frame and, in the same step, discard every row that holds a NaN
# (the cities the API lookup skipped)
city_weather_df = pd.DataFrame(weather_columns).dropna(how="any")

In [7]:
# export the city data into a .csv file within a folder named output_data
city_weather_csv = "./output_data/city_weather_data.csv"

# to_csv does not create missing folders, so make sure the target folder
# exists; exist_ok makes re-running this cell harmless
os.makedirs(os.path.dirname(city_weather_csv), exist_ok=True)
city_weather_df.to_csv(city_weather_csv, index=False)

# display the dataframe
city_weather_df

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,castro,-24.79,-50.01,79.16,52.0,50.0,3.20,BR,1.603206e+09
1,maragogi,-9.01,-35.22,81.86,63.0,25.0,10.71,BR,1.603206e+09
2,marzuq,14.40,46.47,77.95,17.0,14.0,9.04,YE,1.603207e+09
3,dikson,73.51,80.55,21.61,95.0,91.0,10.29,RU,1.603206e+09
4,georgetown,5.41,100.34,84.20,83.0,20.0,3.36,MY,1.603206e+09
...,...,...,...,...,...,...,...,...,...
615,stornoway,58.21,-6.39,51.80,93.0,75.0,18.34,GB,1.603206e+09
616,bara,10.37,10.73,93.20,32.0,20.0,11.41,NG,1.603207e+09
617,kavaratti,10.57,72.64,81.81,72.0,100.0,10.11,IN,1.603207e+09
618,olafsvik,64.89,-23.71,36.88,91.0,100.0,10.92,IS,1.603206e+09


## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [8]:
#  Get the indices of cities that have humidity over 100%.


In [9]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

## Latitude vs. Humidity Plot

## Latitude vs. Cloudiness Plot

## Latitude vs. Wind Speed Plot

## Linear Regression

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression