# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [27]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
from scipy.stats import linregress
import json

# Import API key
from api_keys import weather_api_key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy
units = "imperial"
# Output File (CSV)
output_data_file = "output_data/cities.csv"

# Range of latitudes and longitudes
lat_range = (-90, 90)
lng_range = (-180, 180)

## Generate Cities List

In [28]:
# List for holding lat_lngs and cities
lat_lngs = []
cities = []

# Create a set of random lat and lng combinations
lats = np.random.uniform(lat_range[0], lat_range[1], size=1500)
lngs = np.random.uniform(lng_range[0], lng_range[1], size=1500)
lat_lngs = zip(lats, lngs)

# Identify nearest city for each lat, lng combination
for lat_lng in lat_lngs:
    city = citipy.nearest_city(lat_lng[0], lat_lng[1]).city_name
    
    # If the city is unique, then add it to a our cities list
    if city not in cities:
        cities.append(city)

# Print the city count to confirm sufficient count
len(cities)

612

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it'sbeing processed (with the city number and city name).


In [39]:
# Starting URL for Weather Map API
url = f"http://api.openweathermap.org/data/2.5/weather?appid={weather_api_key}&units={units}&q="

In [40]:
 # Creating empty lists for the dataframe
city_data = []
clouds = []
dates = []
humidity = []
lats = []
lngs = []
max_temps = []
wind_speeds = []
countries = []

# set initial count quantities for organization
record_count = 0
set_count = 1

In [41]:
# print['Beginning Data Retrieval']
# print['-----------------------------']

# loops for creating dataframe columns
for city in cities:
    try:
        response = requests.get(url + city.replace(" ","&")).json()
        clouds.append(response['clouds']['all'])
        countries.append(response['sys']['country'])
        dates.append(response['dt'])
        humidity.append(response['main']['humidity'])
        lats.append(response['coord']['lat'])
        lngs.append(response['coord']['lon'])
        max_temps.append(response['main']['temp_max'])
        wind_speeds.append(response['wind']['speed'])
        if record_count > 50:
            record_count = 1
            set_count += 1
            city_data.append(city)
        else:
            record_count += 1
            city_data.append(city)
        print(f"Processing Record {record_count} of Set {set_count} | {city}")
    except Exception:
        print("City not found. Skipping...")
print("------------------------------\nData Retrieval Complete\n------------------------------")    

Processing Record 1 of Set 1 | fortuna
Processing Record 2 of Set 1 | vostok
Processing Record 3 of Set 1 | tasiilaq
Processing Record 4 of Set 1 | port alfred
City not found. Skipping...
Processing Record 5 of Set 1 | bredasdorp
Processing Record 6 of Set 1 | bandrele
City not found. Skipping...
Processing Record 7 of Set 1 | albany
City not found. Skipping...
Processing Record 8 of Set 1 | lebu
Processing Record 9 of Set 1 | rikitea
Processing Record 10 of Set 1 | hilo
Processing Record 11 of Set 1 | pevek
Processing Record 12 of Set 1 | wewak
Processing Record 13 of Set 1 | chokurdakh
Processing Record 14 of Set 1 | haines junction
Processing Record 15 of Set 1 | san patricio
Processing Record 16 of Set 1 | guerrero negro
City not found. Skipping...
Processing Record 17 of Set 1 | east london
Processing Record 18 of Set 1 | ushuaia
Processing Record 19 of Set 1 | akyab
Processing Record 20 of Set 1 | saint-augustin
Processing Record 21 of Set 1 | corrente
Processing Record 22 of Set

Processing Record 35 of Set 4 | pacific grove
Processing Record 36 of Set 4 | georgetown
Processing Record 37 of Set 4 | saskylakh
Processing Record 38 of Set 4 | naryan-mar
Processing Record 39 of Set 4 | redmond
Processing Record 40 of Set 4 | carnarvon
Processing Record 41 of Set 4 | palu
Processing Record 42 of Set 4 | severo-kurilsk
Processing Record 43 of Set 4 | lethem
City not found. Skipping...
City not found. Skipping...
Processing Record 44 of Set 4 | ghanzi
Processing Record 45 of Set 4 | oranjemund
Processing Record 46 of Set 4 | tres arroyos
Processing Record 47 of Set 4 | lazaro cardenas
City not found. Skipping...
Processing Record 48 of Set 4 | lavrentiya
Processing Record 49 of Set 4 | inhambane
Processing Record 50 of Set 4 | bonavista
Processing Record 51 of Set 4 | cheyenne
Processing Record 1 of Set 5 | xining
Processing Record 2 of Set 5 | cabinda
Processing Record 3 of Set 5 | santiago
Processing Record 4 of Set 5 | hithadhoo
Processing Record 5 of Set 5 | barce

Processing Record 15 of Set 8 | aklavik
Processing Record 16 of Set 8 | puerto narino
Processing Record 17 of Set 8 | sosnovo-ozerskoye
Processing Record 18 of Set 8 | morro bay
Processing Record 19 of Set 8 | uruacu
Processing Record 20 of Set 8 | copertino
Processing Record 21 of Set 8 | george
Processing Record 22 of Set 8 | gaffney
Processing Record 23 of Set 8 | roald
Processing Record 24 of Set 8 | ampanihy
Processing Record 25 of Set 8 | vagay
Processing Record 26 of Set 8 | tommot
Processing Record 27 of Set 8 | iqaluit
Processing Record 28 of Set 8 | yabelo
Processing Record 29 of Set 8 | tucurui
Processing Record 30 of Set 8 | port macquarie
Processing Record 31 of Set 8 | carlos antonio lopez
Processing Record 32 of Set 8 | grenville
Processing Record 33 of Set 8 | dubuque
Processing Record 34 of Set 8 | riesa
Processing Record 35 of Set 8 | akdepe
Processing Record 36 of Set 8 | chubbuck
Processing Record 37 of Set 8 | constitucion
Processing Record 38 of Set 8 | omsukchan


### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

In [43]:
#Creating a dictionary to display the the data frame in rows and columns; 

dict_weather = {
    "City":city_data,
    "Clouds":clouds,
    "Country":countries,
    "Date":dates,
    "Humidity":humidity,
    "Lat":lats,
    "Lng":lngs,
    "Max Temp":max_temps,
    "Wind Speed":wind_speeds
}

In [13]:
# establish dataframe
display_weather = pd.DataFrame(dict_weather)
display_weather.head()

Unnamed: 0,City,Clouds,Country,Date,Humidity,Lat,Lng,Max Temp,Wind Speed
0,thomasville,70,US,1650586696,71,35.8826,-80.082,66.29,3.6
1,digby,100,CA,1650586836,69,44.6169,-65.7655,44.58,14.09
2,mys shmidta,29,RU,1650586836,97,62.0589,48.6201,23.74,1.36
3,cotonou,95,BJ,1650586728,78,6.3654,2.4183,81.57,3.11
4,punta arenas,64,PH,1650586837,74,8.9897,125.34,81.86,5.7


In [14]:
# # output data to csv
# weather_dataframe.to_csv(output_data_file)

In [15]:
weather_dataframe.count()

City          550
Clouds        550
Country       550
Date          550
Humidity      550
Lat           550
Lng           550
Max Temp      550
Wind Speed    550
dtype: int64

In [17]:
weather_dataframe.describe()

Unnamed: 0,Clouds,Date,Humidity,Lat,Lng,Max Temp,Wind Speed
count,550.0,550.0,550.0,550.0,550.0,550.0,550.0
mean,62.858182,1650587000.0,72.154545,22.718993,23.321327,60.617164,7.659891
std,36.235541,87.58971,22.2284,31.604035,88.772071,21.044026,5.650798
min,0.0,1650586000.0,9.0,-54.8,-175.2,-11.87,0.0
25%,29.0,1650587000.0,61.25,-3.08425,-49.92685,47.19,3.33
50%,75.0,1650587000.0,78.0,25.35155,27.78295,64.79,6.03
75%,98.0,1650587000.0,89.0,49.054475,100.349575,78.3075,10.51
max,100.0,1650587000.0,100.0,78.2186,179.3167,97.57,35.99


## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [None]:
#  Get the indices of cities that have humidity over 100%.


In [None]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

## Latitude vs. Humidity Plot

## Latitude vs. Cloudiness Plot

## Latitude vs. Wind Speed Plot

## Linear Regression

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression