# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [None]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import gmaps
import os
import json
from pprint import pprint
from scipy import stats
from scipy.stats import linregress

from citipy import citipy
from datetime import date
import scipy.stats as st


# Import API key
from api_keys import weather_api_key
from citipy import citipy



In [None]:
# Valid latitude/longitude bounds (degrees) used when sampling random coordinates.
lat_range, lon_range = (-90, 90), (-180, 180)

# Empty containers that the following cells fill in:
# city names, coordinate pairs, and the names already seen.
cities, lat_lon, unique_cities = [], [], []

# Load the cities data file (path is relative to the notebook's working
# directory) into a DataFrame and preview its first rows.
cities_pd = pd.read_csv("../output_data/cities.csv")
cities_pd.head()



## Generate Cities List

In [None]:
# Draw 2000 random latitudes and 2000 random longitudes inside the allowed ranges.
lat = np.random.uniform(*lat_range, size=2000)
lon = np.random.uniform(*lon_range, size=2000)

# Pair each latitude with the longitude at the same position.
lat_lon = zip(lat, lon)

# Look up the nearest city for every coordinate pair and keep each city name once.
for point_lat, point_lon in lat_lon:
    location_data = citipy.nearest_city(point_lat, point_lon)
    city, country_name = location_data.city_name, location_data.country_code

    # A name that was already recorded is skipped.
    if city in unique_cities:
        continue

    unique_cities.append(city)
    cities.append(city)

# Report how many distinct city names were collected.
print(len(cities))

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it's being processed (with the city number and city name).



In [None]:
# Base endpoint and the two query-string prefixes built from it.
# Both prefixes end in "q=" so that a city name can be appended directly.
url = "http://api.openweathermap.org/data/2.5/weather?"
units = "metric"

# Prefix without a units parameter.
# NOTE(review): requests built from query_url do not carry `units`, so the API's
# default unit system applies to them -- confirm this is intended.
query_url = f"{url}appid={weather_api_key}&q="

# Prefix that additionally carries the units setting.
API_url = url + "appid=" + weather_api_key + "&units=" + units + "&q="

In [None]:
# One independent, initially empty list per collected field:
# latitude, longitude, temperature, humidity, cloudiness, wind speed,
# timestamp, city name, country code, and the cities with no data.
(
    lat,
    lng,
    temp,
    hum,
    cld,
    wind,
    dt,
    city_list,
    country,
    no_data,
) = ([] for _ in range(10))

In [None]:
# Display the list of city names collected so far.
cities

In [None]:
# Spot-check: request a single city ('chuy') and read the latitude out of the
# JSON response to confirm the request URL works.
requests.get(query_url+'chuy').json()["coord"]["lat"]

In [None]:
# Query the weather API once per city and collect the fields used later in the
# analysis. Progress is logged as "file <number> of Group <group>", where the
# counter restarts and the group advances after every 50 cities.
number = 0
group = 1

# NOTE: no throttling is applied between requests; add a pause here if the
# API's rate limit is reached.

# Start the API run.
print("Initiate API Data Retrieval")
print("-------------------------------")

for place in cities:
    print(f"Processing the file {number} of Group {group} | {place}.")

    try:
        # A timeout keeps one stalled connection from hanging the whole run.
        response = requests.get(query_url + place, timeout=10).json()

        # Read every field before touching the result lists, so that a
        # response missing any key cannot leave the lists with unequal lengths.
        record = (
            response["coord"]["lat"],
            response["coord"]["lon"],
            response["main"]["temp_max"],
            response["main"]["humidity"],
            response["clouds"]["all"],
            response["wind"]["speed"],
            response["dt"],
            response["sys"]["country"],
        )
    except (KeyError, ValueError, requests.exceptions.RequestException):
        # KeyError: the response has no weather fields (e.g. unknown city).
        # ValueError: the body was not valid JSON.
        # RequestException: the HTTP request itself failed or timed out.
        print(f"Weather for the city is unavaliable, checking next city: {place}.")
        no_data.append(place)
    else:
        city_list.append(place)
        for bucket, value in zip(
            (lat, lng, temp, hum, cld, wind, dt, country), record
        ):
            bucket.append(value)

    number = number + 1
    if number == 50:
        number = 0
        group = group + 1

print("-------------------------------")
print("API Retrieval is complete")
# NOTE(review): API_url embeds the API key and is not the prefix used for the
# requests above (query_url is) -- consider not printing it.
print(API_url)
print(f"city name: {city_list}")
print(f"The latitude information received is: {lat}")
print(f"The temperature information received is: {temp}")

        
        

### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

In [None]:
# Print how many longitude values were collected.
print (len(lng))

In [None]:



# Assemble the per-city result lists into one table with one row per city.
# "City" must be the list of retrieved city names (city_list); the loop
# variable `place` is a single string and would be repeated on every row.
# All lists must have the same length for the DataFrame to be built.
weather_by_city_dict = {
    "City": city_list,
    "Country": country,
    "Latitude": lat,
    "Longtitude": lng,
    "Max Temp": temp,
    "Humidity": hum,
    "Cloudiness": cld,
    "Wind Speed": wind,
    "Date": dt,
}

weather_by_city_df = pd.DataFrame(weather_by_city_dict)

# Display the resulting DataFrame.
weather_by_city_df

In [None]:
# Export the city weather table to a CSV file (path is relative to the
# notebook's working directory). No index argument is passed, so pandas'
# default index handling applies.
weather_by_city_df.to_csv("../output_data/weather_data.csv")

## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [None]:
#  Get the indices of cities that have humidity over 100%.


In [None]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

In [None]:
# Scatter plot of maximum temperature against latitude for every retrieved city.
# The data is read from weather_by_city_df, whose columns are named
# "Latitude" and "Max Temp".
# NOTE(review): the title and axis label say "F"; the actual unit depends on
# the units parameter sent with the API requests -- confirm they match.
plt.scatter(
    pd.to_numeric(weather_by_city_df["Latitude"]).astype(float),
    pd.to_numeric(weather_by_city_df["Max Temp"]).astype(float),
    alpha=.5,
    facecolor="red",
    edgecolors="black",
    marker="o",
)
plt.title("Latitude vs Max Temperature in F")
plt.xlabel("Latitude")
plt.ylabel("Temperature (F)")
print("The max temperatures are highest near the equator.")
plt.show()

In [None]:
# Save the current matplotlib figure to the Images folder.
# The original author marked this cell as "dont run this right now".
# NOTE(review): this cell runs after the plotting cell has already called
# plt.show(); the current figure may be empty by then -- confirm the saved
# image actually contains the plot.
plt.savefig("Images/Latitude vs Temperature.png")

## Latitude vs. Humidity Plot

In [None]:
# Scatter plot of humidity against latitude for every retrieved city.
# The data is read from weather_by_city_df, whose columns are named
# "Latitude" and "Humidity".
plt.scatter(
    pd.to_numeric(weather_by_city_df["Latitude"]).astype(float),
    pd.to_numeric(weather_by_city_df["Humidity"]).astype(float),
    facecolors="skyblue",
    edgecolors="purple",
    alpha=0.5,
)
plt.xlabel("Latitude")
plt.ylabel("Humidity (%)")
# NOTE(review): the analysis date in the title is hard-coded.
plt.title("Latitude vs Humidity as at 14/09/2021")
plt.show()

In [None]:
# Save the current matplotlib figure to the Images folder.
# NOTE(review): this cell runs after the plotting cell has already called
# plt.show(); the current figure may be empty by then -- confirm the saved
# image actually contains the plot.
plt.savefig("Images/Latitude vs Humidity.png")

## Latitude vs. Cloudiness Plot

In [None]:
# Save the current matplotlib figure to the Images folder.
# NOTE(review): no plotting code for the cloudiness chart is visible in this
# section -- TODO confirm a figure has been drawn before this is run.
plt.savefig("Images/latitude_cloudiness.png")

## Latitude vs. Wind Speed Plot

In [None]:
# Save the current matplotlib figure to the Images folder.
# NOTE(review): no plotting code for the wind speed chart is visible in this
# section -- TODO confirm a figure has been drawn before this is run.
plt.savefig("Images/latitude vs wind speed.png")

## Linear Regression

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression