# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [11]:
##pip install citipy==0.0.5

Note: you may need to restart the kernel to use updated packages.


In [4]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
import json 
from pandas.io.json import json_normalize

from scipy.stats import linregress

# Import API key
from api_keys import weather_api_key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Output File (CSV)
output_data_file = "output_data/cities.csv"

# Range of latitudes and longitudes
lat_range = (-90, 90)
lng_range = (-180, 180)

## Generate Cities List

In [2]:
# List for holding lat_lngs and cities
lat_lngs = []
cities = []

# Create a set of random lat and lng combinations
lats = np.random.uniform(lat_range[0], lat_range[1], size=1500)
lngs = np.random.uniform(lng_range[0], lng_range[1], size=1500)
lat_lngs = zip(lats, lngs)

# Identify nearest city for each lat, lng combination
for lat_lng in lat_lngs:
    city = citipy.nearest_city(lat_lng[0], lat_lng[1]).city_name
    
    # If the city is unique, then add it to a our cities list
    if city not in cities:
        cities.append(city)

# Print the city count to confirm sufficient count
len(cities)

611

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it'sbeing processed (with the city number and city name).


In [8]:
city_names = []
lat = []
lon =[]
max_temp = []
humidity = []
cloudiness = []
wind_speed = []
country = []
date = []

print('Beginning Data Retrieval ')
print('----------------------')
record = 1
for city in cities:
    url = f"http://api.openweathermap.org/data/2.5/weather?q={city}&appid={weather_api_key}"
    response = requests.get(url).json()
    try:
        city_names.append(response['name'])
        lat.append(response['coord']['lat'])
        lon.append(response['coord']['lon'])
        max_temp.append(response['main']['temp_max'])
        humidity.append(response['main']['humidity'])
        cloudiness.append(response['clouds']['all'])
        wind_speed.append(response['wind']['speed'])
        country.append(response['sys']['country'])
        date.append(response['dt']) 
        print(f'processing record {record} | {city}')
        record +=1 
        time.sleep(1.1)
    except:
        print ('city not found skipping....')

Beginning Data Retrieval 
----------------------
processing record 1 | cascais
processing record 2 | bluff
processing record 3 | majene
processing record 4 | bathsheba
city not found skipping....
city not found skipping....
processing record 5 | barrow
processing record 6 | albany
processing record 7 | mataura
processing record 8 | hermanus
processing record 9 | saint-philippe
processing record 10 | nisia floresta
processing record 11 | provideniya
processing record 12 | henties bay
city not found skipping....
processing record 13 | bredasdorp
processing record 14 | poso
processing record 15 | kaitangata
processing record 16 | makakilo city
processing record 17 | gambela
processing record 18 | mae sot
processing record 19 | leningradskiy
processing record 20 | rikitea
processing record 21 | busselton
processing record 22 | hithadhoo
processing record 23 | tatarsk
processing record 24 | ushuaia
processing record 25 | grand gaube
processing record 26 | saldanha
processing record 27 | bar

processing record 231 | bayonne
processing record 232 | naze
processing record 233 | faya
city not found skipping....
processing record 234 | srednekolymsk
city not found skipping....
processing record 235 | san carlos de bariloche
city not found skipping....
processing record 236 | carnarvon
processing record 237 | dawei
processing record 238 | tiksi
processing record 239 | brae
processing record 240 | nojorid
processing record 241 | dikson
processing record 242 | romny
city not found skipping....
processing record 243 | chama
processing record 244 | kavaratti
processing record 245 | dudinka
city not found skipping....
processing record 246 | gisborne
processing record 247 | araceli
processing record 248 | jinchang
processing record 249 | murdochville
processing record 250 | khawhai
processing record 251 | dubai
processing record 252 | paamiut
processing record 253 | changji
processing record 254 | sulejowek
processing record 255 | kota bahru
processing record 256 | mgachi
processing 

processing record 460 | riyadh
processing record 461 | vardo
processing record 462 | shakawe
processing record 463 | alofi
city not found skipping....
processing record 464 | kozelsk
processing record 465 | filingue
city not found skipping....
processing record 466 | uruzgan
processing record 467 | itarema
processing record 468 | deputatskiy
processing record 469 | hualmay
processing record 470 | mandalgovi
processing record 471 | ejea de los caballeros
processing record 472 | lensk
processing record 473 | nizwa
processing record 474 | dwarka
processing record 475 | la ronge
city not found skipping....
processing record 476 | reichenau
processing record 477 | atessa
processing record 478 | yanam
city not found skipping....
processing record 479 | priargunsk
processing record 480 | tatawin
processing record 481 | el jicaro
processing record 482 | port blair
city not found skipping....
processing record 483 | augustow
processing record 484 | palmer
processing record 485 | bambanglipuro
p

In [10]:
df = pd.DataFrame({'city': city_names, 'date': date, 'latitude': lat, 'Longitutude': lon, 'maximum Temperature': max_temp, 'Humidity': humidity, 'Cloudiness': cloudiness, 'Wind Speed': wind_speed, 'Country': country, 'Date': date})
df

Unnamed: 0,city,date,latitude,Longitutude,maximum Temperature,Humidity,Cloudiness,Wind Speed,Country,Date
0,Cascais,1605902846,38.70,-9.42,292.59,55,0,3.10,PT,1605902846
1,Bluff,1605902846,-46.60,168.33,290.93,59,59,7.15,NZ,1605902846
2,Majene,1605902997,-3.54,118.97,298.78,83,100,1.55,ID,1605902997
3,Bathsheba,1605902998,13.22,-59.52,300.15,83,75,5.10,BB,1605902998
4,Barrow,1605902999,71.29,-156.79,259.15,77,20,6.70,US,1605902999
...,...,...,...,...,...,...,...,...,...,...
558,Belvedere Marittimo,1605903657,39.62,15.86,286.48,99,100,4.37,IT,1605903657
559,Poronaysk,1605903658,49.22,143.12,267.02,88,100,2.70,RU,1605903658
560,Sola,1605903659,-13.88,167.55,298.91,80,99,2.08,VU,1605903659
561,Reconquista,1605903660,-29.15,-59.65,301.75,29,0,1.62,AR,1605903660


In [16]:
# Save Data to csv
df.to_csv("Weather_part1.csv")



## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [18]:
for city in cities:
    filter_df = df.loc[df["Humidity"]> 100]
    filter_df = filter_df.drop(["city"])

KeyError: "['city'] not found in axis"

In [None]:
#  Get the indices of cities that have humidity over 100%.


In [None]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

## Latitude vs. Humidity Plot

## Latitude vs. Cloudiness Plot

## Latitude vs. Wind Speed Plot

## Linear Regression

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression