# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [1]:
# Dependencies and Setup
import time
from pathlib import Path
from pprint import pprint

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import requests
from scipy.stats import linregress

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Import API key
from api_keys import weather_api_key

# Path of the CSV file intended to hold the city data
output_data_file = "output_data/cities.csv"

# (min, max) bounds used when sampling random latitudes and longitudes
lat_range, lng_range = (-90, 90), (-180, 180)

In [2]:
# Prefix a line with ! to run it as a terminal (shell) command from the notebook
#!pip freeze 
#!pip install citipy

## Generate Cities List

In [3]:
# Build the list of distinct cities nearest to a set of random coordinates.
# NOTE(review): no random seed is set, so a different city list is produced on every run.

# Create a set of random lat and lng combinations
lats = np.random.uniform(lat_range[0], lat_range[1], size=1500)
lngs = np.random.uniform(lng_range[0], lng_range[1], size=1500)
lat_lngs = zip(lats, lngs)

# Identify the nearest city for each lat, lng combination and keep each name once.
# dict.fromkeys drops repeats with a hash lookup (instead of scanning a list for
# every candidate) while preserving the order in which cities were first seen.
cities = list(dict.fromkeys(
    citipy.nearest_city(lat, lng).city_name for lat, lng in lat_lngs
))

# Print the city count to confirm sufficient count
len(cities)

634

In [4]:
# Sanity check: print the generated list of city names
print(cities)

['huescar', 'raudeberg', 'torbay', 'punta arenas', 'vaini', 'portland', 'yellowknife', 'majene', 'gawler', 'east london', 'saskylakh', 'ushuaia', 'flin flon', 'rikitea', 'ribeira grande', 'tsihombe', 'belushya guba', 'hilo', 'cilegon', 'sines', 'bluff', 'mar del plata', 'teguise', 'cape town', 'bargal', 'hermanus', 'avera', 'santa cruz', 'vanimo', 'ukiah', 'cabo san lucas', 'imeni zhelyabova', 'kostinbrod', 'lyubytino', 'bengkulu', 'tuatapere', 'nizhneyansk', 'manicore', 'victoria', 'lorengau', 'new norfolk', 'port alfred', 'busselton', 'taolanaro', 'emba', 'hobart', 'avarua', 'klaksvik', 'gogrial', 'chingirlau', 'mareeba', 'albany', 'kavieng', 'fasa', 'seoul', 'samarai', 'barrow', 'poum', 'sitka', 'atuona', 'khatanga', 'dunedin', 'komsomolskiy', 'joao pinheiro', 'port-gentil', 'thompson', 'tecpan', 'aksu', 'pisco', 'zhanaozen', 'talnakh', 'mataura', 'moyale', 'port elizabeth', 'emerald', 'havoysund', 'bom jesus da lapa', 'adre', 'awbari', 'lungi', 'carnarvon', 'bilsanda', 'bemidji', '

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it's being processed (with the city number and city name).

> **HINT:** The OpenWeatherMap API only allows 60 calls per minute under their free plan. Try using `time.sleep(60)` after each set of 50 cities to avoid API errors due to large calls.

In [5]:
# OpenWeather API calls: base endpoint for the current-weather lookup.
# HTTPS is used so the API key carried in the query string is not sent in clear text.
url = "https://api.openweathermap.org/data/2.5/weather?"
# Units requested from the API ("imperial" presumably yields Fahrenheit and mph — confirm against the API docs)
unit_parameter = "imperial"

# Build partial query URL and use sample city to test
query_url_test = f"{url}appid={weather_api_key}&units={unit_parameter}&q=Knoxville"
# The display below stays commented out after testing because it reveals the API key embedded in the URL
#display (query_url_test)

In [6]:
# Reusable query prefix built from the same pieces as the test URL; a city name is appended after "q="
query_url = "{}appid={}&units={}&q=".format(url, weather_api_key, unit_parameter)
# The display below stays disabled after testing: printing the URL would reveal the API key
#display (query_url)

In [7]:
# Start from an empty table that only defines the columns to be filled per city
weather_columns = [
    'country',
    'city',
    'lat',
    'lon',
    'date',
    'cloudiness',
    'humidity',
    'max_temp',
    'wind_speed',
]
df = pd.DataFrame(columns=weather_columns)

display(df)

Unnamed: 0,country,city,lat,lon,date,cloudiness,humidity,max_temp,wind_speed


In [8]:
# Assemble the request prefix used for every city lookup.
# The earlier test with Knoxville confirmed that this URL layout generates the correct results.
query_url = "%sappid=%s&units=%s&q=" % (url, weather_api_key, unit_parameter)

In [9]:
# Fetch the current weather for every city and assemble the results into `df`.
# The table is rebuilt from scratch each time this cell runs, so re-running it
# does not append duplicate rows to an earlier result.
df_columns = ['country', 'city', 'lat', 'lon', 'date', 'cloudiness', 'humidity', 'max_temp', 'wind_speed']

# Rows are collected in a plain list and converted to a DataFrame once at the end;
# this avoids re-copying the whole table on every iteration.
city_records = []

for count, city in enumerate(cities, start=1):
    # Pause for a minute at every 50th city to stay under the API's per-minute call limit
    if count % 50 == 0:
        time.sleep(60)
    try:
        print(f'Retrieving data for city {city}')
        # Get values for current city; the timeout keeps one stalled request
        # from blocking the whole run
        city_info = requests.get(query_url + city, timeout=30).json()

        # A response without the expected fields (e.g. an error payload for an
        # unknown city) raises KeyError here and the city is skipped below
        city_records.append({
            'country': city_info['sys']['country'],
            'city': city,
            'lat': city_info['coord']['lat'],
            'lon': city_info['coord']['lon'],
            'date': city_info['dt'],
            'cloudiness': city_info['clouds']['all'],
            'humidity': city_info['main']['humidity'],
            'max_temp': city_info['main']['temp_max'],
            'wind_speed': city_info['wind']['speed'],
        })

    # Only expected failures are skipped: network errors, a non-JSON body, or
    # missing fields. Anything else (including a manual interrupt) still surfaces.
    except (requests.exceptions.RequestException, KeyError, ValueError):
        print(f'Data for city {city} is not available')

# One row per successfully retrieved city, in request order, with a fresh 0..n-1 index
df = pd.DataFrame(city_records, columns=df_columns)

Retrieving data for city huescar
Retrieving data for city raudeberg
Retrieving data for city torbay
Retrieving data for city punta arenas
Retrieving data for city vaini
Retrieving data for city portland
Retrieving data for city yellowknife
Retrieving data for city majene
Retrieving data for city gawler
Retrieving data for city east london
Retrieving data for city saskylakh
Retrieving data for city ushuaia
Retrieving data for city flin flon
Retrieving data for city rikitea
Retrieving data for city ribeira grande
Retrieving data for city tsihombe
Data for city tsihombe is not available
Retrieving data for city belushya guba
Data for city belushya guba is not available
Retrieving data for city hilo
Retrieving data for city cilegon
Retrieving data for city sines
Retrieving data for city bluff
Retrieving data for city mar del plata
Retrieving data for city teguise
Retrieving data for city cape town
Retrieving data for city bargal
Data for city bargal is not available
Retrieving data for cit

Retrieving data for city luderitz
Retrieving data for city shirokiy
Retrieving data for city cooma
Retrieving data for city saint-francois
Retrieving data for city nemuro
Retrieving data for city san pedro buenavista
Retrieving data for city tuktoyaktuk
Retrieving data for city buala
Retrieving data for city biak
Retrieving data for city aklavik
Retrieving data for city sorong
Retrieving data for city iqaluit
Retrieving data for city whitehorse
Retrieving data for city presidencia roque saenz pena
Retrieving data for city balimo
Data for city balimo is not available
Retrieving data for city acapulco
Retrieving data for city georgetown
Retrieving data for city urumqi
Retrieving data for city husavik
Retrieving data for city faya
Retrieving data for city diapaga
Retrieving data for city hauterive
Retrieving data for city east stroudsburg
Retrieving data for city hervey bay
Retrieving data for city salalah
Retrieving data for city itarema
Retrieving data for city alyangula
Retrieving data

Retrieving data for city ust-kuyga
Retrieving data for city mayor pablo lagerenza
Retrieving data for city hami
Retrieving data for city arawa
Retrieving data for city camana
Retrieving data for city madaoua
Retrieving data for city harlingen
Retrieving data for city saint-pierre
Retrieving data for city itacare
Retrieving data for city hudson bay
Retrieving data for city moberly
Retrieving data for city luanda
Retrieving data for city sunrise manor
Retrieving data for city rungata
Data for city rungata is not available
Retrieving data for city airai
Retrieving data for city cayenne
Retrieving data for city hasaki
Retrieving data for city rawannawi
Data for city rawannawi is not available
Retrieving data for city panama city
Retrieving data for city wajima
Retrieving data for city anloga
Retrieving data for city yingkou
Retrieving data for city vredendal
Retrieving data for city ranong
Retrieving data for city pandan
Retrieving data for city suhbaatar
Retrieving data for city matara
Re

In [15]:
# Show the city weather table collected by the API loop
display(df)

Unnamed: 0,country,city,lat,lon,date,cloudiness,humidity,max_temp,wind_speed
0,ES,huescar,37.8110,-2.5412,1643259221,100,91,43.93,6.40
1,NO,raudeberg,61.9875,5.1352,1643259221,100,95,43.47,5.99
2,CA,torbay,47.6666,-52.7314,1643259020,100,96,28.27,18.41
3,CL,punta arenas,-53.1500,-70.9167,1643258969,40,76,50.11,21.85
4,TO,vaini,-21.2000,-175.2000,1643259222,20,84,86.16,6.91
...,...,...,...,...,...,...,...,...,...
581,US,kahului,20.8947,-156.4700,1643261591,20,76,74.84,8.05
582,RU,kholm,59.2667,32.8500,1643261650,100,90,18.73,10.29
583,BR,ilhabela,-23.7781,-45.3581,1643261613,76,80,77.41,5.99
584,ES,aranda de duero,41.6704,-3.6892,1643261651,0,60,34.12,5.55


### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

In [16]:
# Solution approach: on each city iteration the retrieved values are stored in a dictionary, which becomes one row of a pandas DataFrame.
# The per-city rows are stacked together to populate the main DataFrame.

In [17]:
# Export the df DataFrame with the cities data to the output_data folder.
# NOTE(review): the setup cell defines output_data_file = "output_data/cities.csv",
# which differs from the path written here — confirm which location is intended.
cities_csv_path = Path('../output_data/cities_output.csv')
# to_csv does not create missing folders, so make sure the target directory exists first
cities_csv_path.parent.mkdir(parents=True, exist_ok=True)
df.to_csv(cities_csv_path)


## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [13]:
#  Get the indices of cities that have humidity over 100%.


In [14]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

## Latitude vs. Humidity Plot

## Latitude vs. Cloudiness Plot

## Latitude vs. Wind Speed Plot

## Linear Regression

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression