# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [9]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
from scipy.stats import linregress

# Import API key
from api_keys import weather_api_key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Output File (CSV)
output_data_file = "output_data/cities.csv"

# Range of latitudes and longitudes
lat_range = (-90, 90)
lng_range = (-180, 180)

## Generate Cities List

In [10]:
# List for holding lat_lngs and cities
lat_lngs = []
cities = []

# Create a set of random lat and lng combinations
lats = np.random.uniform(lat_range[0], lat_range[1], size=1500)
lngs = np.random.uniform(lng_range[0], lng_range[1], size=1500)
lat_lngs = zip(lats, lngs)

# Identify nearest city for each lat, lng combination
for lat_lng in lat_lngs:
    city = citipy.nearest_city(lat_lng[0], lat_lng[1]).city_name
    
    # If the city is unique, then add it to a our cities list
    if city not in cities:
        cities.append(city)

# Print the city count to confirm sufficient count
len(cities)

621

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it'sbeing processed (with the city number and city name).


In [11]:
# Save config information


# Build query URL
url = "http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

cloudiness = []
country = []
date = []
max_temp = []
humidity = []
lat = []
lng = []
wind_speed = []
city_name = []



### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

In [12]:
counter = 1
sets = 0
t0 = time.time()
error = 0
cities_temp = cities
i = 1
for city in cities_temp:
    time.sleep(1)
    city=city
    query_url = url + "&q=" + city.replace(" ", "+")
    weather_response = requests.get(query_url).json()


    try: 
        cloudiness.append(weather_response["clouds"]["all"])
        country.append(weather_response["sys"]["country"])
        date.append(weather_response["dt"])
        max_temp.append(weather_response["main"]['temp_max'])
        humidity.append(weather_response["main"]['humidity'])
        lat.append(weather_response["coord"]["lat"])  
        lng.append(weather_response["coord"]["lon"])
        wind_speed.append(weather_response["wind"]["speed"])
        city_name.append(weather_response["name"])
        print(f"processing record {i} | {city}")
        i+=1
    except:
        print(f"Data for this {city} Not Found")
        pass

print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")


processing record 1 | mataura
processing record 2 | hobart
processing record 3 | togur
processing record 4 | hofn
processing record 5 | urucui
processing record 6 | husavik
processing record 7 | solnechnyy
processing record 8 | black river
processing record 9 | lompoc
processing record 10 | haapiti
processing record 11 | sitka
processing record 12 | ushuaia
processing record 13 | nanortalik
processing record 14 | cape town
processing record 15 | codrington
Data for this sentyabrskiy Not Found
processing record 16 | salta
processing record 17 | kapaa
processing record 18 | tateyama
processing record 19 | drovyanaya
processing record 20 | hithadhoo
processing record 21 | busselton
processing record 22 | iqaluit
processing record 23 | new norfolk
processing record 24 | vanimo
processing record 25 | punta arenas
processing record 26 | oistins
processing record 27 | puerto ayora
processing record 28 | kodiak
processing record 29 | vao
processing record 30 | aljezur
processing record 31 | po

In [13]:
cities_df = pd.DataFrame({
    "cloudiness": cloudiness,
    "country": country,
    "date": date,
    "max_temp": max_temp,
    "lat": lat,
    "lng": lng,
    "wind_speed": wind_speed,
    "city_name": city_name
})
cities_df.to_csv("openweathermaps.csv",index=False)
cities_df


Unnamed: 0,cloudiness,country,date,max_temp,lat,lng,wind_speed,city_name
0,11,NZ,1631672003,51.48,-46.1927,168.8643,5.93,Mataura
1,75,AU,1631671761,54.05,-42.8794,147.3294,1.99,Hobart
2,100,RU,1631672005,40.08,58.3631,82.8265,4.85,Togur
3,100,IS,1631671972,51.31,64.2539,-15.2082,16.15,Hofn
4,40,BR,1631672008,84.25,-7.2294,-44.5561,5.53,Uruçuí
...,...,...,...,...,...,...,...,...
565,38,ET,1631672811,53.67,12.6000,37.4667,4.76,Gonder
566,67,GT,1631672812,68.83,14.2258,-90.4742,2.48,Pueblo Nuevo Viñas
567,100,PA,1631672813,80.33,9.5167,-79.0333,2.68,Tubualá
568,5,GF,1631672815,78.04,5.6592,-53.7767,8.19,Mana


## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [14]:
#  Get the indices of cities that have humidity over 100%.


In [15]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

## Latitude vs. Humidity Plot

## Latitude vs. Cloudiness Plot

## Latitude vs. Wind Speed Plot

## Linear Regression

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression