# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [7]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
from scipy.stats import linregress

# Import API key
from api_keys import weather_api_key
units = "imperial"

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Output File (CSV)
output_data_file = "output_data/cities.csv"

# Range of latitudes and longitudes
lat_range = (-90, 90)
lng_range = (-180, 180)


# url information
url = "http://api.openweathermap.org/data/2.5/weather?"
weather_url = f"{url}appid={weather_api_key}&units={units}&q={city}"

## Generate Cities List

In [8]:
# List for holding lat_lngs and cities
lat_lngs = []
cities = []

# Create a set of random lat and lng combinations
lats = np.random.uniform(low=-90.00, high=90.00, size=1500)
lngs = np.random.uniform(low=-180.000, high=180.000, size=1500)
lat_lngs = zip(lats, lngs)

# Identify nearest city for each lat, lng combination
for lat_lng in lat_lngs:
    city = citipy.nearest_city(lat_lng[0], lat_lng[1]).city_name
    
    # If the city is unique, then add it to a our cities list
    if city not in cities:
        cities.append(city)

# Print the city count to confirm sufficient count
len(cities)
cities

['lubango',
 'shimoda',
 'kaitangata',
 'cape town',
 'albany',
 'bato',
 'hilo',
 'puerto ayora',
 'torbay',
 'kapaa',
 'rafiganj',
 'lushunkou',
 'teresina',
 'havre-saint-pierre',
 'nizhneyansk',
 'acari',
 'palaikastron',
 'caravelas',
 'ormstown',
 'chinna salem',
 'kununurra',
 'taolanaro',
 'port elizabeth',
 'hermanus',
 'hobart',
 'atuona',
 'muroto',
 'punta arenas',
 'port angeles',
 'lira',
 'ushuaia',
 'qaanaaq',
 'provideniya',
 'umzimvubu',
 'iwanai',
 'port hardy',
 'te anau',
 'katsuura',
 'flinders',
 'sabha',
 'bethel',
 'hasaki',
 'lensk',
 'busselton',
 'bonthe',
 'bilibino',
 'arraial do cabo',
 'mpika',
 'saint-philippe',
 'malwan',
 'dikson',
 'mataura',
 'pevek',
 'marabba',
 'upernavik',
 'ambodifototra',
 'rikitea',
 'ponta do sol',
 'yellowknife',
 'tura',
 'viedma',
 'sentyabrskiy',
 'coquimbo',
 'jiaonan',
 'kodiak',
 'yining',
 'khatanga',
 'gayny',
 'payson',
 'chuy',
 'barentsburg',
 'kahului',
 'sao filipe',
 'rocha',
 'lazarev',
 'nikolskoye',
 'butar

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it'sbeing processed (with the city number and city name).


In [None]:
#lists 
longitude =  []
latitude = []
humidity = []
temp_max = []
wind = []
clouds = []
date = []
country = []
city_name = []

#count variables
count_one = 1
set_one = 1

#loops
for city in cities:
    try:
        response =requests.get(url).json()
        print(f"Processing Record {count_one} of Set {set_one} | {city.title()}")
        longitude.append(response["coord"]["lon"])
        latitude.append(response["coord"]["lat"])
        humidity.append(response["main"]["humidity"])
        temp_max.append(response["main"]["temp_max"])
        wind.append(response["wind"]["speed"])
        clouds.append(response["clouds"]["all"])
        date.append(response["dt"])
        country.append(response["sys"]["country"])
        city_name.append(response["name"])
    except:
        print("City not found. Skipping...")
    
    count_one += 1
    if count_one == 49:
        count_one = 1
        set_one += 1
print("------------------------------\nData Retrieval Complete\n------------------------------")

### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

In [None]:
#dictionary
Cities_df = pd.DataFrame({"City": city_name,
                        "Temperature": temp_max,
                        "Humidity": humidity,
                        "Date": date,
                        "Cloudiness" : clouds,
                        "Windspeed": windspeed,
                        "Country": country,
                        "Latitude": latitude,
                        "Longitude": longitude
                         })
Cities_df.to_csv("CitiesDF.csv", index=False)
Cities_df

## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [None]:
#  Get the indices of cities that have humidity over 100%.


In [None]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

In [None]:
plt.scatter(CitiesDF["Latitude"], CitiesDF["Temperature"])
plt.title("Latitude versus Temperature - April 20th")
plt.xlabel("Latitude")
plt.ylabel("Temperature")
plt.grid(True)
plt.savefig('Lat_v_Temp.png')

## Latitude vs. Humidity Plot

In [None]:
plt.scatter(CitiesDF["Latitude"], CitiesDF["Humidity"])
plt.title("Latitude versus Humidity - April 20th")
plt.xlabel("Latitude")
plt.ylabel("Humidity")
plt.grid(True)
plt.savefig('Lat_v_Humidity.png')

## Latitude vs. Cloudiness Plot

In [None]:

plt.scatter(CitiesDF["Latitude"], CitiesDF["Clouds"])
plt.title("Latitude versus Clouds - April 20th")
plt.xlabel("Latitude")
plt.ylabel("Clouds")
plt.grid(True)
plt.savefig('Lat_v_Cloudiness.png')

## Latitude vs. Wind Speed Plot

In [None]:
plt.scatter(CitiesDF["Latitude"], CitiesDF["Windspeed"])
plt.title("Latitude versus Windspeed - April 20th")
plt.xlabel("Latitude")
plt.ylabel("Windspeed")
plt.grid(True)
plt.savefig('Lat_v_Windspeed.png')

## Linear Regression

In [None]:
# Create Northern and Southern Hemisphere DataFrames
northern_hemisphere = weather_dataframe.loc[weather_dataframe["Lat"] >= 0]
southern_hemisphere = weather_dataframe.loc[weather_dataframe["Lat"] < 0]

#linear regression 
def linear_agression(x,y):
    print(f"The r-squared is : {round(st.pearsonr(x, y)[0],2)}")
    (slope, intercept, rvalue, pvalue, stderr) = linregress(x, y)
    regress_values = x * slope + intercept
    line_eq = "y = " + str(round(slope,2)) + "x + " + str(round(intercept,2))
    plt.scatter(x, y)
    plt.plot(x,regress_values,"r-")
    return line_eq
#line of regression
def annotate(line_eq, a, b):
    plt.annotate(line_eq,(a,b),fontsize=15,color="red")

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

In [None]:
equation = linear_agression(northern_hemisphere["Lat"],northern_hemisphere["Temperature"])
annotate(equation, -30, 50)

# Set a title
plt.title("Northern Hemisphere - Max Temp vs. Latitude Linear Regression")
plt.xlabel("Latitude")
plt.ylabel("Max Temp (F)")

# Save the figure
plt.savefig("../Images/Northern Hemisphere - Max Temp vs. Latitude Linear Regression.png")

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

In [None]:
equation = linear_agression(southern_hemisphere["Lat"],southern_hemisphere["Temperature"])
annotate(equation, -30, 50)

# Set a title
plt.title("Southern Hemisphere - Max Temp vs. Latitude Linear Regression")
plt.xlabel("Latitude")
plt.ylabel("Max Temp (F)")

# Save the figure
plt.savefig("../Images/Southern Hemisphere - Max Temp vs. Latitude Linear Regression.png")

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

In [None]:
# getting data
equation = linear_agression(northern_hemisphere["Lat"], northern_hemisphere["Humidity"])
annotate(equation, 40, 15)

# Set a title and labels
plt.title("Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression")
plt.xlabel("Latitude")
plt.ylabel("Humidity (%)")

# Save the figure
plt.savefig("../Images/Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression.png")

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

In [None]:
# getting data
equation = linear_agression(southern_hemisphere["Lat"], southern_hemisphere["Humidity"])
annotate(equation, 40, 15)

# Set a title and labels
plt.title("Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression")
plt.xlabel("Latitude")
plt.ylabel("Humidity (%)")

# Save the figure
plt.savefig("../Images/Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression.png")

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

In [None]:
# getting data
equation = linear_agression(northern_hemisphere["Lat"], northern_hemisphere["Clouds"])
annotate(equation, -30, 40)

# Set a title, labels
plt.title("Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression")
plt.xlabel("Latitude")
plt.ylabel("Cloudiness (%)")

# Save the figure
plt.savefig("../Images/Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression.png")

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

In [None]:

equation = linear_agression(southern_hemisphere["Lat"], southern_hemisphere["Clouds"])
annotate(equation, -30, 40)
plt.title("Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression")
plt.xlabel("Latitude")
plt.ylabel("Cloudiness (%)")

# Save the figure
plt.savefig("../Images/Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression.png")

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

In [None]:
equation = linear_agression(southern_hemisphere["Lat"], northern_hemisphere["Windspeed"])
annotate(equation, -30, 15)

# Set  title
plt.title("Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression")
plt.xlabel("Latitude")
plt.ylabel("Wind Speed (mph)")
#save
plt.savefig("../Images/Northern Hemisphere - Wind Speed vs. Latitude Linear Regression.png")

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

In [None]:
equation = linear_agression(southern_hemisphere["Lat"], southern_hemisphere["Windspeed"])
annotate(equation, -30, 15)

# Set  title and labels
plt.title("Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression")
plt.xlabel("Latitude")
plt.ylabel("Wind Speed (mph)")

# Save the figure
plt.savefig("../Images/Southern Hemisphere - Wind Speed vs. Latitude Linear Regression.png")