# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [1]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
from scipy.stats import linregress

# Import API key
from config import key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Output File (CSV)
# NOTE(review): the export cell further down writes to 'WeatherPy.csv', not to
# this path — confirm which destination is intended.
output_data_file = "output_data/cities.csv"

# Range of latitudes and longitudes
# (low, high) bounds handed to np.random.uniform when sampling random coordinates.
lat_range = (-90, 90)
lng_range = (-180, 180)

## Generate Cities List

In [2]:
# Sample 1500 random coordinates inside the configured latitude/longitude bounds.
lats = np.random.uniform(low=lat_range[0], high=lat_range[1], size=1500)
lngs = np.random.uniform(low=lng_range[0], high=lng_range[1], size=1500)
lat_lngs = zip(lats, lngs)

# Map every coordinate to its nearest city, keeping each city name only once
# (first occurrence wins, so the list preserves discovery order).
cities = []
for lat_lng in lat_lngs:
    sample_lat, sample_lng = lat_lng
    city = citipy.nearest_city(sample_lat, sample_lng).city_name
    if city in cities:
        continue
    cities.append(city)

# Show how many distinct cities were found to confirm the sample is large enough
len(cities)

605

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it's being processed (with the city number and city name).


In [None]:
# Parallel lists: index i in every list describes the same successfully
# retrieved city, so they must always grow together.
temp = []
humid = []
cloud = []
wind_sp = []
lat = []
lng = []
date = []
country = []
new_city = []

# HTTPS keeps the API key out of plaintext traffic.
base_url = "https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + key

# Running counters of cities attempted (both start at 1 and advance once per city).
count = 1
record = 1

for city in cities:
    print(f'Please wait while we retrieve data on {city}')
    record += 1
    try:
        # Passing the city through `params` lets requests URL-encode it;
        # the timeout stops one stalled connection from hanging the whole run.
        response = requests.get(base_url, params={"q": city}, timeout=10).json()

        # Read every field BEFORE touching the lists: if any key is missing the
        # KeyError fires here and no list is left one element longer than the rest.
        city_lng = response['coord']['lon']
        city_lat = response['coord']['lat']
        city_temp = response['main']['temp_max']
        city_cloud = response['clouds']['all']
        city_humid = response['main']['humidity']
        city_wind = response['wind']['speed']
        city_date = response['dt']
        city_country = response['sys']['country']
        city_name = response['name']
    except KeyError:
        # The API answered, but without the expected weather payload.
        print("Data not found")
    except (requests.exceptions.RequestException, ValueError) as err:
        # Network failure or a non-JSON body. Only the exception type is printed
        # because the full message can contain the request URL and the API key.
        print(f"Request failed for {city} ({type(err).__name__})")
    else:
        lng.append(city_lng)
        lat.append(city_lat)
        temp.append(city_temp)
        cloud.append(city_cloud)
        humid.append(city_humid)
        wind_sp.append(city_wind)
        date.append(city_date)
        country.append(city_country)
        new_city.append(city_name)
    count = count + 1

print(f'End of data retrieval')

Please wait while we retrieve data on lushnje
Please wait while we retrieve data on belushya guba
Data not found
Please wait while we retrieve data on laguna
Please wait while we retrieve data on upernavik
Please wait while we retrieve data on haines junction
Please wait while we retrieve data on kapaa
Please wait while we retrieve data on barrow
Please wait while we retrieve data on mar del plata
Please wait while we retrieve data on rigaud
Please wait while we retrieve data on yellowknife
Please wait while we retrieve data on souillac
Please wait while we retrieve data on ust-kamchatsk
Data not found
Please wait while we retrieve data on ballina
Please wait while we retrieve data on kavieng
Please wait while we retrieve data on honiara
Please wait while we retrieve data on bluff
Please wait while we retrieve data on namwala
Please wait while we retrieve data on busselton
Please wait while we retrieve data on ushuaia
Please wait while we retrieve data on vitim
Please wait while we ret

Data not found
Please wait while we retrieve data on ha tinh
Please wait while we retrieve data on leningradskiy
Please wait while we retrieve data on nouna
Please wait while we retrieve data on pacific grove
Please wait while we retrieve data on okoneshnikovo
Please wait while we retrieve data on yinchuan
Please wait while we retrieve data on tumannyy
Data not found
Please wait while we retrieve data on mulege
Please wait while we retrieve data on tuatapere
Please wait while we retrieve data on boca raton
Please wait while we retrieve data on haapiti
Please wait while we retrieve data on atar
Please wait while we retrieve data on half moon bay
Please wait while we retrieve data on georgetown
Please wait while we retrieve data on dzhebariki-khaya
Please wait while we retrieve data on nova olinda do norte
Please wait while we retrieve data on pointe michel
Please wait while we retrieve data on ponta do sol
Please wait while we retrieve data on shelburne
Please wait while we retrieve dat

Please wait while we retrieve data on amparafaravola
Please wait while we retrieve data on kazalinsk
Data not found
Please wait while we retrieve data on adre
Please wait while we retrieve data on opuwo
Please wait while we retrieve data on moose factory
Please wait while we retrieve data on contamana
Please wait while we retrieve data on honghu
Please wait while we retrieve data on norman wells
Please wait while we retrieve data on oga
Please wait while we retrieve data on poum
Please wait while we retrieve data on chino valley
Please wait while we retrieve data on alofi
Please wait while we retrieve data on sancraiul-de-mures
Data not found
Please wait while we retrieve data on lyubeshiv
Data not found
Please wait while we retrieve data on uyuni
Please wait while we retrieve data on lasa
Please wait while we retrieve data on saint-augustin
Please wait while we retrieve data on temaraia
Data not found
Please wait while we retrieve data on barra dos coqueiros
Please wait while we retri

Please wait while we retrieve data on camabatela
Please wait while we retrieve data on ksenyevka
Data not found
Please wait while we retrieve data on porbandar
Please wait while we retrieve data on kushima
Please wait while we retrieve data on tasbuget
Data not found
Please wait while we retrieve data on lazaro cardenas
Please wait while we retrieve data on szczecinek
Please wait while we retrieve data on qaqortoq
Please wait while we retrieve data on kenora
Please wait while we retrieve data on zharkent
Please wait while we retrieve data on pandua
Please wait while we retrieve data on capaci
Please wait while we retrieve data on novo aripuana
Please wait while we retrieve data on morrinhos
Please wait while we retrieve data on muhoroni
Please wait while we retrieve data on barhiya
Please wait while we retrieve data on petropavlovka
Please wait while we retrieve data on los altos
Please wait while we retrieve data on salekhard
Please wait while we retrieve data on tahta
Please wait whi

### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

In [None]:
# Assemble the per-city lists into one table; dict insertion order fixes the
# column order of the resulting DataFrame.
trip_columns = {
    "City": new_city,
    "Country": country,
    "Date": date,
    "Lat": lat,
    "Lng": lng,
    "Max Temp": temp,
    "Humidity": humid,
    "Cloudiness": cloud,
    "Wind Speed": wind_sp,
}
trip_df = pd.DataFrame(trip_columns)

# Preview the first rows
trip_df.head()

In [None]:
# Persist the retrieved weather table as CSV (the DataFrame index is written
# as the first, unnamed column because to_csv keeps the index by default).
trip_df.to_csv(path_or_buf='WeatherPy.csv')

## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [None]:
#  Get the indices of cities that have humidity over 100%.


In [None]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

In [None]:
# Scatter of max temperature against latitude for every retrieved city.
plt.scatter(lat, temp, marker='o', edgecolors="black")
plt.title("Latitude vs Temperature (F)")
plt.xlabel("Latitude")
plt.ylabel("Temperature")
# Save BEFORE show(): in a notebook the figure is finalised by show(), so a
# savefig call issued afterwards writes a fresh, empty canvas.
plt.savefig('LatvsTemp.png')
plt.show()
print("Where Latitude is close to 0, higher temperatures can be found")

## Latitude vs. Humidity Plot

In [None]:
# Scatter of humidity against latitude for every retrieved city.
plt.scatter(lat, humid, marker = 'o', edgecolors="black")
plt.title("Latitude vs Humidity")
plt.xlabel("Latitude")
plt.ylabel("Humidity")
# Save BEFORE show(): in a notebook the figure is finalised by show(), so a
# savefig call issued afterwards writes a fresh, empty canvas.
plt.savefig('Latvshum.png')
plt.show()
print("Humidity is higher when latitude is closest to zero")

## Latitude vs. Cloudiness Plot

In [None]:
# Scatter of cloudiness against latitude for every retrieved city.
plt.scatter(lat, cloud, marker='o', edgecolors="black")
plt.title("Latitude vs Cloudiness")
plt.xlabel("Latitude")
plt.ylabel("Cloudiness")
# Save BEFORE show(): in a notebook the figure is finalised by show(), so a
# savefig call issued afterwards writes a fresh, empty canvas.
plt.savefig('Latvscloud.png')
plt.show()
print("There is no correlation betwwen cloudiness and latitude")

## Latitude vs. Wind Speed Plot

In [None]:
# Scatter of wind speed against latitude for every retrieved city.
plt.scatter(lat, wind_sp, marker='o', edgecolors="black")
plt.title("Latitude vs Wind Speed")
plt.xlabel("Latitude")
plt.ylabel("Wind Speed")
# Save BEFORE show(): in a notebook the figure is finalised by show(), so a
# savefig call issued afterwards writes a fresh, empty canvas.
plt.savefig('Latvswindspeed.png')
plt.show()
print("There is no correlation between wind speed and latitude")

## Linear Regression

In [None]:
# Split the table by hemisphere for the regression plots:
# Lat >= 0 (equator included) is northern, Lat < 0 is southern.
in_north = trip_df['Lat'] >= 0
in_south = trip_df['Lat'] < 0
north_hemi = trip_df.loc[in_north]
south_hemi = trip_df.loc[in_south]

# Only the last expression of a cell is rendered, so this previews the
# southern frame.
north_hemi.head()
south_hemi.head()

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

In [None]:
# Northern Hemisphere: least-squares fit of latitude (y) against max temperature (x).
x_data = north_hemi['Max Temp']
y_data = north_hemi['Lat']
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_data, y_data)
# Fitted y for each observed x; plotted as the regression line.
regress = x_data * slope + intercept
line_eq = "y =" + str(round(slope,2)) + "x +" + str(round(intercept,2))
plt.scatter(x_data,y_data)
plt.plot(x_data, regress, "r-")
# Place the equation in axes-fraction coordinates so it is always inside the
# plot; a fixed data-space point is skipped whenever it falls outside the axes.
plt.annotate(line_eq, (0.05, 0.05), xycoords="axes fraction", fontsize=15, color="red")
plt.xlabel("Temperature")
plt.ylabel("Latitude")
print(f"The r-squared is: {rvalue **2}")
print("As Latitude approaches 0 temperature increases")
# Save BEFORE show(): a savefig issued after show() writes an empty canvas.
plt.savefig('northLatvsTemp.png')
plt.show()

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

In [None]:
# Southern Hemisphere: least-squares fit of latitude (y) against max temperature (x).
x_data = south_hemi['Max Temp']
y_data = south_hemi['Lat']
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_data, y_data)
# Fitted y for each observed x; plotted as the regression line.
regress = x_data * slope + intercept
line_eq = "y =" + str(round(slope,2)) + "x +" + str(round(intercept,2))
plt.scatter(x_data,y_data)
plt.plot(x_data, regress, "r-")
# Southern latitudes are all negative, so the old data-space anchor (6, 10)
# lay outside the axes and the equation was never drawn. Axes-fraction
# coordinates keep it inside the plot regardless of the data range.
plt.annotate(line_eq, (0.05, 0.9), xycoords="axes fraction", fontsize=15, color="red")
plt.xlabel("Temperature")
plt.ylabel("Latitude")
print(f"The r-squared is: {rvalue **2}")
print("As the latitude approaches 0, the temperature increases")
# Save BEFORE show(): a savefig issued after show() writes an empty canvas.
plt.savefig('southLatvsTemp.png')
plt.show()

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

In [None]:
# Northern Hemisphere: least-squares fit of latitude (y) against humidity (x).
# The x series must be the 'Humidity' column to match the axis label and the
# section heading (it previously re-used 'Max Temp').
x_data = north_hemi['Humidity']
y_data = north_hemi['Lat']
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_data, y_data)
# Fitted y for each observed x; plotted as the regression line.
regress = x_data * slope + intercept
line_eq = "y =" + str(round(slope,2)) + "x +" + str(round(intercept,2))
plt.scatter(x_data,y_data)
plt.plot(x_data, regress, "r-")
# Place the equation in axes-fraction coordinates so it is always inside the
# plot; a fixed data-space point is skipped whenever it falls outside the axes.
plt.annotate(line_eq, (0.05, 0.9), xycoords="axes fraction", fontsize=15, color="red")
plt.xlabel("Humidity %")
plt.ylabel("Latitude")
print(f"The r-squared is: {rvalue **2}")
print("As latitude approaches 0, humidity increases")
# Save BEFORE show(): a savefig issued after show() writes an empty canvas.
plt.savefig('northLatvshum.png')
plt.show()

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

In [None]:
# Southern Hemisphere: least-squares fit of latitude (y) against humidity (x).
x_data = south_hemi['Humidity']
y_data = south_hemi['Lat']
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_data, y_data)
# Fitted y for each observed x; plotted as the regression line.
regress = x_data * slope + intercept
line_eq = "y =" + str(round(slope,2)) + "x +" + str(round(intercept,2))
plt.scatter(x_data,y_data)
plt.plot(x_data, regress, "r-")
# Southern latitudes are all negative, so the old data-space anchor (6, 10)
# lay outside the axes and the equation was never drawn. Axes-fraction
# coordinates keep it inside the plot regardless of the data range.
plt.annotate(line_eq, (0.05, 0.9), xycoords="axes fraction", fontsize=15, color="red")
plt.xlabel("Humidity (%)")
plt.ylabel("Latitude")
print(f"The r-squared is: {rvalue **2}")
print("As latitude approaches 0, humidity increases")
# Save BEFORE show(): a savefig issued after show() writes an empty canvas.
plt.savefig('southLatvshum.png')
plt.show()

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

In [None]:
# Northern Hemisphere: least-squares fit of latitude (y) against cloudiness (x).
x_data = north_hemi['Cloudiness']
y_data = north_hemi['Lat']
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_data, y_data)
# Fitted y for each observed x; plotted as the regression line.
regress = x_data * slope + intercept
line_eq = "y =" + str(round(slope,2)) + "x +" + str(round(intercept,2))
plt.scatter(x_data,y_data)
plt.plot(x_data, regress, "r-")
# Place the equation in axes-fraction coordinates so it is always inside the
# plot; a fixed data-space point is skipped whenever it falls outside the axes.
plt.annotate(line_eq, (0.05, 0.9), xycoords="axes fraction", fontsize=15, color="red")
plt.xlabel("Cloudiness (%)")
plt.ylabel("Latitude")
print(f"The r-squared is: {rvalue **2}")
print("There is no correlation between cloudiness and latitude")
# Save BEFORE show(): a savefig issued after show() writes an empty canvas.
plt.savefig('northLatvscloud.png')
plt.show()

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

In [None]:
# Southern Hemisphere: least-squares fit of latitude (y) against cloudiness (x).
x_data = south_hemi['Cloudiness']
y_data = south_hemi['Lat']
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_data, y_data)
# Fitted y for each observed x; plotted as the regression line.
regress = x_data * slope + intercept
line_eq = "y =" + str(round(slope,2)) + "x +" + str(round(intercept,2))
plt.scatter(x_data,y_data)
plt.plot(x_data, regress, "r-")
# Southern latitudes are all negative, so the old data-space anchor (6, 10)
# lay outside the axes and the equation was never drawn. Axes-fraction
# coordinates keep it inside the plot regardless of the data range.
plt.annotate(line_eq, (0.05, 0.9), xycoords="axes fraction", fontsize=15, color="red")
plt.xlabel("Cloudiness (%)")
plt.ylabel("Latitude")
print(f"The r-squared is: {rvalue **2}")
print("There is no correlation between cloudiness and latitude")
# Save BEFORE show(): a savefig issued after show() writes an empty canvas.
plt.savefig('southLatvscloud.png')
plt.show()

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

In [None]:
# Northern Hemisphere: least-squares fit of latitude (y) against wind speed (x).
x_data = north_hemi['Wind Speed']
y_data = north_hemi['Lat']
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_data, y_data)
# Fitted y for each observed x; plotted as the regression line.
regress = x_data * slope + intercept
line_eq = "y =" + str(round(slope,2)) + "x +" + str(round(intercept,2))
plt.scatter(x_data,y_data)
plt.plot(x_data, regress, "r-")
# Place the equation in axes-fraction coordinates so it is always inside the
# plot; a fixed data-space point is skipped whenever it falls outside the axes.
plt.annotate(line_eq, (0.05, 0.9), xycoords="axes fraction", fontsize=15, color="red")
plt.xlabel("Windspeed (MPH)")
plt.ylabel("Latitude")
print(f"The r-squared is: {rvalue **2}")
print("There is no correlation between wind speed and latitude")
# Save BEFORE show(): a savefig issued after show() writes an empty canvas.
plt.savefig('northLatvswind.png')
plt.show()

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

In [None]:
# Southern Hemisphere: least-squares fit of latitude (y) against wind speed (x).
x_data = south_hemi['Wind Speed']
y_data = south_hemi['Lat']
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_data, y_data)
# Fitted y for each observed x; plotted as the regression line.
regress = x_data * slope + intercept
line_eq = "y =" + str(round(slope,2)) + "x +" + str(round(intercept,2))
plt.scatter(x_data,y_data)
plt.plot(x_data, regress, "r-")
# Southern latitudes are all negative, so the old data-space anchor (6, 10)
# lay outside the axes and the equation was never drawn. Axes-fraction
# coordinates keep it inside the plot regardless of the data range.
plt.annotate(line_eq, (0.05, 0.9), xycoords="axes fraction", fontsize=15, color="red")
plt.xlabel("Wind Speed (MPH)")
plt.ylabel("Latitude")
print(f"The r-squared is: {rvalue **2}")
print("There is no correlation between wind speed and latitude")
# Save BEFORE show(): a savefig issued after show() writes an empty canvas.
plt.savefig('southLatvswind.png')
plt.show()