# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [1]:
#dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
import datetime
from scipy.stats import linregress

#import API key
from api_keys import weather_api_key

#import citipy to determine city based on latitude and longitude
from citipy import citipy

#import geopy to find country based on latitude and longitude
from geopy.geocoders import Nominatim

#output to File (CSV)
output_data_file = "output_data/cities.csv"

#range of latitudes and longitudes
lat_range = (-90, 90)
lng_range = (-180, 180)

## Generate Cities List

In [2]:
#list for holding lat/lng and cities
lat_lngs = []
cities = []

#create a set of random lat and lng combinations, zip into one list variable
lats = np.random.uniform(lat_range[0], lat_range[1], size=1500)
lngs = np.random.uniform(lng_range[0], lng_range[1], size=1500)
lat_lngs = zip(lats, lngs)


#identify nearest city for each lat, lng combination
for lat_lng in lat_lngs:
    city = citipy.nearest_city(lat_lng[0], lat_lng[1]).city_name
    
    #if the city is not already in our cities list, add it
    if city not in cities:
        cities.append(city)

#print the city count to confirm sufficient count
len(cities)

625

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it'sbeing processed (with the city number and city name).


In [4]:

url = 'http://api.openweathermap.org/data/2.5/weather?units=imperial&appid=' + weather_api_key + '&q=' 

cityData = []
cityDataStats = []
set_count = 1 #group
record = 1 #record within group

print(f'Beginning Data Retrieval')
print(f'----------------------------')

for i, city in enumerate(cities):
    if(i % 50 == 0 and i >= 50):
        set_count += 1 #make new group
        record = 0 #reset records in the group 
        
#output record and group being processed
    print(f'processing record {record} of set {set_count} | {city}')       
     
    record += 1
    
    cityurl = url + city
    try:
        cityWeather = requests.get(cityurl).json()
        lat = cityWeather['coord']['lat']
        lon = cityWeather['coord']['lon']
        maxTemp = cityWeather['main']['temp_max']
        humidity = cityWeather['main']['humidity']
        cloudiness = cityWeather['clouds']['all']
        windSpeed = cityWeather['wind']['speed']
        date = cityWeather['dt']
        timestamp = datetime.datetime.fromtimestamp(date)
        dateConvert = timestamp.strftime('%m-%d-%Y At %H:%M:%S')
        geolocator = Nominatim(user_agent="python_api_project")
        location = geolocator.reverse(str(lat)+","+str(lon))
        address = location.raw['address']
        country_code = address.get('country_code').upper()
        
        cityData.append({'City':city, 'Lat':round(lat, 2), 'Lng':round(lon, 2), 'Max Temp': str(maxTemp) + ' F', 
                         'Humidity':str(humidity) + '%', 'Cloudiness':str(cloudiness) + '%', 'Wind Speed':str(windSpeed) + ' MPH',
                        'Country': country_code, 'Date':dateConvert})
        cityDataStats.append({'Lat':lat, 'Lng':lon, 'Max Temp': maxTemp, 
                         'Humidity':humidity, 'Cloudiness':cloudiness, 'Wind Speed':windSpeed,
                        'Date':date})

        
        

    except:
        print(f'{city} not found. Skipping...')
     
    if (i == 19):
        break

Beginning Data Retrieval
----------------------------
processing record 1 of set 1 | bluff
processing record 2 of set 1 | nurota
processing record 3 of set 1 | margate
processing record 4 of set 1 | beringovskiy
processing record 5 of set 1 | cape town
processing record 6 of set 1 | buchanan
processing record 7 of set 1 | olafsvik
processing record 8 of set 1 | vaini
processing record 9 of set 1 | castro
processing record 10 of set 1 | geraldton
processing record 11 of set 1 | rikitea
processing record 12 of set 1 | punta arenas
processing record 13 of set 1 | karakendzha
karakendzha not found. Skipping...
processing record 14 of set 1 | karia
processing record 15 of set 1 | creel
processing record 16 of set 1 | qaanaaq
processing record 17 of set 1 | marzuq
processing record 18 of set 1 | malatya
processing record 19 of set 1 | hithadhoo
processing record 20 of set 1 | chokurdakh


### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

In [5]:
cityData_pd = pd.DataFrame(cityData)
cityData_pd.head()

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,bluff,-46.6,168.33,45 F,95%,25%,1.99 MPH,NZ,04-23-2021 At 08:37:14
1,nurota,40.56,65.69,69.8 F,23%,36%,4.61 MPH,UZ,04-23-2021 At 08:46:52
2,margate,51.38,1.39,52 F,55%,0%,4 MPH,GB,04-23-2021 At 08:41:41
3,beringovskiy,63.05,179.32,14.59 F,87%,98%,6.33 MPH,RU,04-23-2021 At 08:36:36
4,cape town,-33.93,18.42,68 F,60%,0%,10.36 MPH,ZA,04-23-2021 At 08:37:09


In [6]:
cityDataStats_pd = pd.DataFrame(cityDataStats)
cityDataStats_pd.describe(datetime_is_numeric=True)

Unnamed: 0,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Date
count,19.0,19.0,19.0,19.0,19.0,19.0,19.0
mean,12.321684,11.711705,58.231579,63.842105,43.947368,7.152632,1619192000.0
std,42.022361,100.034385,27.693145,29.37925,41.515022,5.781142,282.4286
min,-53.15,-175.2,-13.5,11.0,0.0,1.14,1619192000.0
25%,-23.9557,-59.68755,45.7,47.5,1.5,3.375,1619192000.0
50%,11.7306,11.1629,68.0,71.0,27.0,5.23,1619192000.0
75%,45.97135,69.38595,74.725,89.5,92.5,8.825,1619193000.0
max,77.484,179.3167,101.98,99.0,100.0,20.4,1619193000.0


## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [None]:
#get the indices of cities that have humidity over 100%.
cityDataClean_pd = cityData_pd
for i, city in enumerate(cities):
    url = 'http://api.openweathermap.org/data/2.5/weather?units=imperial&appid=' + weather_api_key + '&q='
    cityurl = url + city
    try:
        cityWeather = requests.get(cityurl).json()
        if((cityWeather['main']['humidity']) > 100):
            cityDataClean.drop(i, axis=0)
    except:
        print('Humidity data not retrievable. Skipping...')
cityDataClean_pd.head()
        

Humidity data not retrievable. Skipping...
Humidity data not retrievable. Skipping...
Humidity data not retrievable. Skipping...
Humidity data not retrievable. Skipping...
Humidity data not retrievable. Skipping...
Humidity data not retrievable. Skipping...
Humidity data not retrievable. Skipping...
Humidity data not retrievable. Skipping...
Humidity data not retrievable. Skipping...
Humidity data not retrievable. Skipping...
Humidity data not retrievable. Skipping...
Humidity data not retrievable. Skipping...
Humidity data not retrievable. Skipping...
Humidity data not retrievable. Skipping...
Humidity data not retrievable. Skipping...
Humidity data not retrievable. Skipping...
Humidity data not retrievable. Skipping...
Humidity data not retrievable. Skipping...
Humidity data not retrievable. Skipping...
Humidity data not retrievable. Skipping...
Humidity data not retrievable. Skipping...
Humidity data not retrievable. Skipping...
Humidity data not retrievable. Skipping...
Humidity da

In [None]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

## Latitude vs. Humidity Plot

## Latitude vs. Cloudiness Plot

## Latitude vs. Wind Speed Plot

## Linear Regression

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression