# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [1]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
from scipy.stats import linregress

# Import API key
import api_keys

# Use citipy to find the city from its latitude and longitude
from citipy import citipy

# Output File (CSV)
# NOTE(review): this relative path differs from the "../output_data/cities.csv"
# path read below — confirm which working directory the notebook is run from.
output_data_file = "output_data/cities.csv"

# Read the city weather CSV into a DataFrame and preview its first rows
city_weather = pd.read_csv("../output_data/cities.csv")
city_weather.head()

Unnamed: 0,City_ID,City,Cloudiness,Country,Date,Humidity,Lat,Lng,Max Temp,Wind Speed
0,0,ostrovnoy,2,RU,1558378754,72,68.05,39.51,37.5,7.16
1,1,mahebourg,75,MU,1558378503,74,-20.41,57.7,78.8,11.41
2,2,qaanaaq,25,GL,1558378755,73,77.48,-69.36,22.2,2.37
3,3,zhuhai,0,CN,1558378755,39,40.71,112.04,44.6,4.47
4,4,cape town,20,ZA,1558378755,76,-33.93,18.42,55.99,8.05


## Generate Cities List

In [2]:
# Lists for holding the unique city names (and, reserved for later use, countries)
cities = []
countries = []

# Range of latitudes and longitudes
lat_range = (-90, 90)
lng_range = (-180, 180)

# Create a set of random lat and lng combinations
# NOTE: lat_range[0] is -90 and lat_range[1] is 90 from above
lat = np.random.uniform(lat_range[0], lat_range[1], size=1500)
lng = np.random.uniform(lng_range[0], lng_range[1], size=1500)
locations = zip(lat, lng)

# Identify the nearest city for each lat, lng combination.
# `seen_cities` mirrors `cities` as a set so the duplicate check is O(1)
# per coordinate, while `cities` keeps the order of first appearance.
seen_cities = set()
for lat_lng in locations:
    city_name = citipy.nearest_city(lat_lng[0], lat_lng[1]).city_name

    # Add each city only the first time it is encountered
    if city_name not in seen_cities:
        seen_cities.add(city_name)
        cities.append(city_name)

print(len(cities))
cities

620


['malbork',
 'amga',
 'ushuaia',
 'stutterheim',
 'yulara',
 'port alfred',
 'dawei',
 'qaanaaq',
 'kuching',
 'rikitea',
 'shihezi',
 'souillac',
 'longyearbyen',
 'hvammstangi',
 'yangambi',
 'senador jose porfirio',
 'puerto ayora',
 'mataura',
 'norman wells',
 'ribeira grande',
 'hurghada',
 'busselton',
 'fairbanks',
 'tungkang',
 'torbay',
 'marawi',
 'mattru',
 'mehamn',
 'carnarvon',
 'bluff',
 'barrow',
 'kapaa',
 'punta arenas',
 'bathsheba',
 'jumla',
 'santa vitoria do palmar',
 'butaritari',
 'namibe',
 'albany',
 'bredasdorp',
 'nanortalik',
 'new norfolk',
 'saravan',
 'guerrero negro',
 'vaini',
 'slavsk',
 'quepos',
 'huangchuan',
 'kruisfontein',
 'taolanaro',
 'tuatapere',
 'isangel',
 'bilma',
 'muros',
 'cape town',
 'katol',
 'fortuna',
 'severo-yeniseyskiy',
 'saldanha',
 'talnakh',
 'bandundu',
 'amderma',
 'sentyabrskiy',
 'castro',
 'dunedin',
 'marcona',
 'kadykchan',
 'hobart',
 'upernavik',
 'baykit',
 'bardiyah',
 'qasigiannguit',
 'hofn',
 'iqaluit',
 's

In [7]:
# Randomly select up to 500 cities for weather data.
# DataFrame.sample (without replacement) raises ValueError when n is larger
# than the number of rows, so cap the sample size at the frame's length.
sample_size = min(500, len(city_weather))
random_cities = city_weather.sample(n=sample_size)

# Visualize the selected cities DataFrame.
random_cities

Unnamed: 0,City_ID,City,Cloudiness,Country,Date,Humidity,Lat,Lng,Max Temp,Wind Speed
13,13,saskylakh,0,RU,1558378757,91,71.97,114.09,4.92,2.26
534,534,marzuq,84,YE,1558378896,36,14.40,46.47,79.44,6.02
130,130,cravo norte,100,CO,1558378778,67,6.30,-70.20,85.02,3.09
302,302,alofi,75,NU,1558378845,94,-19.06,-169.92,75.20,6.93
243,243,buchach,75,UA,1558378822,100,49.06,25.39,70.00,2.24
...,...,...,...,...,...,...,...,...,...,...
299,299,jiuquan,0,CN,1558378844,14,39.73,98.49,59.64,5.50
223,223,koronowo,20,PL,1558378736,60,53.31,17.94,71.01,3.36
254,254,rocha,97,UY,1558378828,96,-34.48,-54.34,61.08,11.30
435,435,dong xoai,100,VN,1558378870,71,11.53,106.92,83.76,5.44


In [None]:
# OpenWeatherMap API Key
api_key = api_keys.weather_api_key

# Base URL for API Call (HTTPS so the key is not sent in clear text)
base_url = 'https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=' + api_key

# Display only the part of the URL before the key: echoing `base_url` itself
# would store the API key in the notebook's saved output.
base_url.split('&APPID=')[0]

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it's being processed (with the city number and city name).


In [None]:
# Open lists for the following columns to hold data.
# Each list receives exactly one value per successfully retrieved city,
# so all seven lists always have the same length.
city = []
lats = []
lngs = []
temps = []
humidity = []
clouds = []
winds = []

# Running number of the next successful retrieval, shown in the progress log
city_counter = 1

# Loop through each city, extract required items, and print result
print('''
------------------------------
City Weather Data Retrieval
------------------------------''')

# Query the API once per city name; skip cities that cannot be retrieved
for query_city in cities:
    try:
        # `params` lets requests URL-encode names containing spaces or
        # special characters; the timeout keeps one stalled call from
        # hanging the whole run.
        response_json = requests.get(
            base_url, params={"q": query_city}, timeout=10
        ).json()

        # Read every field BEFORE appending anything, so a missing key
        # cannot leave the lists with different lengths.
        record = (
            response_json["name"],
            response_json['coord']['lat'],
            response_json['coord']['lon'],
            response_json['main']['temp'],
            response_json['main']['humidity'],
            response_json['clouds']['all'],
            response_json['wind']['speed'],
        )
    except (KeyError, IndexError):
        print(f'Missing data in city {query_city} | Skipping')
        continue
    except (requests.exceptions.RequestException, ValueError) as error:
        # Only the exception type is logged: the full message may contain
        # the request URL, which includes the API key.
        print(f'Request failed for city {query_city} ({type(error).__name__}) | Skipping')
        continue

    for column, value in zip((city, lats, lngs, temps, humidity, clouds, winds), record):
        column.append(value)

    print(f'City number {city_counter} of {len(cities)} complete. | Added {query_city}')

    # Advance the counter only after a successful retrieval
    city_counter += 1

print('''
------------------------------
End of City Weather Data Retrieval
------------------------------''')




### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [None]:
#  Get the indices of cities that have humidity over 100%.


In [None]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

## Latitude vs. Humidity Plot

## Latitude vs. Cloudiness Plot

## Latitude vs. Wind Speed Plot

## Linear Regression

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression