# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [1]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
from scipy.stats import linregress

# Import API key
from api_keys import weather_api_key


# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Output File (CSV)
# NOTE(review): no other cell visible in this notebook reads this variable;
# the export cell writes to its own hard-coded path. Confirm which is intended.
output_data_file = "output_data/cities.csv"

# Range of latitudes and longitudes
lat_range = (-90, 90)
lng_range = (-180, 180)

# Request imperial units because the exercise reports temperatures in Fahrenheit
units = "imperial"

# Base query URL for the OpenWeatherMap current-weather endpoint; the city name
# is appended after "q=". HTTPS is used so the API key is not sent in plaintext.
url = "https://api.openweathermap.org/data/2.5/weather?"
query_url = f"{url}appid={weather_api_key}&units={units}&q="

# Display the URL with the key masked, so the secret is not saved in the
# notebook output
f"{url}appid=<API_KEY>&units={units}&q="

'http://api.openweathermap.org/data/2.5/weather?appid=<API_KEY>&units=imperial&q='

## Generate Cities List

In [2]:
# Draw 1500 random latitude/longitude pairs spanning the configured ranges
lat_low, lat_high = lat_range
lng_low, lng_high = lng_range
lats = np.random.uniform(lat_low, lat_high, size=1500)
lngs = np.random.uniform(lng_low, lng_high, size=1500)
lat_lngs = zip(lats, lngs)

# Look up the nearest city for every pair, keeping each city name only once
# and in the order it was first seen
cities = []
seen_cities = set()
for lat, lng in lat_lngs:
    city = citipy.nearest_city(lat, lng).city_name
    if city in seen_cities:
        continue
    seen_cities.add(city)
    cities.append(city)

# Show how many unique cities were found to confirm the sample is large enough
len(cities)

622

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it's being processed (with the city number and city name).


In [3]:
# Print the log header expected in the output.

print('''Beginning Data Retrieval     
-----------------------------''')

# State used by the retrieval loop.

record_num = 0                   # Position inside the current set ("Processing Record *1* of Set 1"); counts every city attempted.
record_set = 1                   # Current set number ("Processing Record 1 of Set *1*"); advances after every 50 cities.
city_result = []                 # One dict per city found (lat/lng/temp/humidity/cloudiness/wind/country/date); becomes the DataFrame.

# Query the API once per city and keep the fields needed for the DataFrame.
# Example request: <query_url>ostrovnoy, i.e. ...?appid=<API_KEY>&units=imperial&q=ostrovnoy

for city in cities:
    record_num += 1              # Count the attempt up front so skipped cities still use up a record number.

    try:
        # The request and the JSON decoding are inside the try so that a timeout,
        # a dropped connection or a non-JSON body skips this city instead of
        # aborting the whole run. The timeout stops a stalled request from hanging forever.
        weather_response = requests.get(query_url + city, timeout=10)
        weather_json = weather_response.json()

        # A response that lacks any of these keys raises KeyError and is
        # reported as a city that was not found.
        latitude = weather_json["coord"]["lat"]
        longitude = weather_json["coord"]["lon"]
        max_temp = weather_json["main"]["temp_max"]
        humidity = weather_json["main"]["humidity"]
        cloudiness = weather_json["clouds"]["all"]
        wind_speed = weather_json["wind"]["speed"]
        country = weather_json["sys"]["country"]
        date = weather_json["dt"]

        # Record the city only once every field has been read successfully.
        city_result.append({"City": city, "Lat": latitude, "Lng": longitude, "Max Temp": max_temp,
                            "Humidity": humidity, "Cloudiness": cloudiness, "Wind Speed": wind_speed,
                            "Country": country, "Date": date})

        print(f"Processing Record {record_num} of Set {record_set} | {city}")

    except KeyError:
        print("City not found.Skipping...")

    except (requests.exceptions.RequestException, ValueError) as error:
        # Network failure or a body that is not valid JSON: report it and move on.
        print(f"Request failed for {city} ({error}). Skipping...")

    # After 50 cities, start a new set and pause before continuing.
    if record_num == 50:
        record_set += 1
        record_num = 0
        time.sleep(10)           # Leave a gap between sets to avoid errors from the API.

print('''-----------------------------
Data Retrieval Complete      
-----------------------------''')

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | san quintin
Processing Record 2 of Set 1 | ushuaia
Processing Record 3 of Set 1 | leningradskiy
Processing Record 4 of Set 1 | omboue
City not found.Skipping...
City not found.Skipping...
Processing Record 7 of Set 1 | dutlwe
Processing Record 8 of Set 1 | port alfred
Processing Record 9 of Set 1 | mahebourg
Processing Record 10 of Set 1 | quelimane
Processing Record 11 of Set 1 | victoria
Processing Record 12 of Set 1 | dikson
Processing Record 13 of Set 1 | hermanus
Processing Record 14 of Set 1 | okha
Processing Record 15 of Set 1 | ginda
Processing Record 16 of Set 1 | okakarara
City not found.Skipping...
Processing Record 18 of Set 1 | deputatskiy
Processing Record 19 of Set 1 | san cristobal
Processing Record 20 of Set 1 | north mankato
Processing Record 21 of Set 1 | koulikoro
Processing Record 22 of Set 1 | takab
Processing Record 23 of Set 1 | atuona
Processing Record 24 of Set 1 | busse

Processing Record 5 of Set 5 | amarwara
Processing Record 6 of Set 5 | kindu
City not found.Skipping...
Processing Record 8 of Set 5 | nome
Processing Record 9 of Set 5 | san andres
Processing Record 10 of Set 5 | alexandria
Processing Record 11 of Set 5 | harrisburg
Processing Record 12 of Set 5 | matagami
Processing Record 13 of Set 5 | klaksvik
Processing Record 14 of Set 5 | isilkul
Processing Record 15 of Set 5 | beyneu
Processing Record 16 of Set 5 | kununurra
Processing Record 17 of Set 5 | loreto
Processing Record 18 of Set 5 | bairiki
Processing Record 19 of Set 5 | nyeri
Processing Record 20 of Set 5 | rio grande
Processing Record 21 of Set 5 | chagoda
Processing Record 22 of Set 5 | xiuyan
Processing Record 23 of Set 5 | peringat
City not found.Skipping...
Processing Record 25 of Set 5 | dong hoi
Processing Record 26 of Set 5 | merauke
Processing Record 27 of Set 5 | kalnibolotskaya
Processing Record 28 of Set 5 | pevek
Processing Record 29 of Set 5 | oktyabrskoye
Processing

Processing Record 12 of Set 9 | pangody
Processing Record 13 of Set 9 | canavieiras
Processing Record 14 of Set 9 | mumbwa
Processing Record 15 of Set 9 | nishihara
Processing Record 16 of Set 9 | sorong
City not found.Skipping...
Processing Record 18 of Set 9 | shwebo
Processing Record 19 of Set 9 | saint anthony
Processing Record 20 of Set 9 | kedrovyy
Processing Record 21 of Set 9 | sechura
Processing Record 22 of Set 9 | cabo san lucas
City not found.Skipping...
Processing Record 24 of Set 9 | christchurch
Processing Record 25 of Set 9 | surgana
Processing Record 26 of Set 9 | yumen
Processing Record 27 of Set 9 | savannah bight
Processing Record 28 of Set 9 | coahuayana
Processing Record 29 of Set 9 | karasuk
Processing Record 30 of Set 9 | kirksville
Processing Record 31 of Set 9 | bubanza
Processing Record 32 of Set 9 | ternate
City not found.Skipping...
City not found.Skipping...
Processing Record 35 of Set 9 | yulara
Processing Record 36 of Set 9 | pringsewu
Processing Record 

Processing Record 13 of Set 13 | ambon
Processing Record 14 of Set 13 | itarema
Processing Record 15 of Set 13 | okhotsk
Processing Record 16 of Set 13 | nong khai
Processing Record 17 of Set 13 | sakakah
City not found.Skipping...
Processing Record 19 of Set 13 | santa rosa
Processing Record 20 of Set 13 | barinas
Processing Record 21 of Set 13 | bon accord
Processing Record 22 of Set 13 | pinega
-----------------------------
Data Retrieval Complete      
-----------------------------


### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

In [5]:
# Build the results table from the per-city records collected by the retrieval loop.
# No cleaning is applied here; call dropna() on the result if missing values ever appear.

weather_result = pd.DataFrame(data=city_result)
weather_result

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,san quintin,30.4833,-115.9500,58.98,76,21,15.39,MX,1619228845
1,ushuaia,-54.8000,-68.3000,42.80,93,75,13.80,AR,1619228755
2,leningradskiy,69.3833,178.4167,29.35,85,96,5.66,RU,1619228846
3,omboue,-1.5746,9.2618,77.45,91,100,3.27,GA,1619228846
4,dutlwe,-23.9833,23.9000,60.60,36,0,6.04,BW,1619228846
...,...,...,...,...,...,...,...,...,...
563,sakakah,29.9697,40.2064,75.20,13,0,10.36,SA,1619229163
564,santa rosa,14.3122,121.1114,89.01,66,20,5.75,PH,1619229163
565,barinas,8.6226,-70.2075,82.40,65,17,1.14,VE,1619229164
566,bon accord,53.8335,-113.4187,37.40,35,75,4.61,CA,1619229164


In [7]:
# Export the city weather table to CSV with a header row and without the index column.

weather_result.to_csv(
    path_or_buf="output_data/weather_city_data.csv",
    index=False,
    header=True,
)


In [8]:
# Use .describe() to show summary statistics for the numeric columns of the DataFrame

weather_summary = weather_result.describe()
weather_summary

Unnamed: 0,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Date
count,568.0,568.0,568.0,568.0,568.0,568.0,568.0
mean,19.5438,14.96984,60.638415,67.808099,54.408451,7.835,1619229000.0
std,33.064347,91.820755,19.189151,23.256794,39.799126,5.08319,122.8937
min,-54.8,-179.1667,9.88,6.0,0.0,0.45,1619228000.0
25%,-7.612,-69.52915,44.6,55.0,11.0,4.445,1619229000.0
50%,22.29275,25.43505,62.69,73.0,64.0,6.845,1619229000.0
75%,47.706575,95.41665,78.01,86.25,94.25,10.36,1619229000.0
max,78.2186,179.3167,92.89,100.0,100.0,32.73,1619229000.0


## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [None]:
#  Get the indices of cities that have humidity over 100%.


In [None]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

## Latitude vs. Humidity Plot

## Latitude vs. Cloudiness Plot

## Latitude vs. Wind Speed Plot

## Linear Regression

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression