# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [1]:
# Dependencies and Setup
import os
import time

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import requests
from scipy.stats import linregress

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Import API key
from api_keys import weather_api_key

# Destination path for the exported city data (CSV)
output_data_file = "output_data/cities.csv"

# Coordinate bounds as (min, max) tuples: latitudes first, then longitudes
lat_range, lng_range = (-90, 90), (-180, 180)

## Generate Cities List

In [2]:
# Create a set of random lat and lng combinations within the configured bounds.
# NOTE: np.random is not seeded, so the sampled coordinates (and therefore the
# city list) differ on every run.
lats = np.random.uniform(low=lat_range[0], high=lat_range[1], size=1500)
lngs = np.random.uniform(low=lng_range[0], high=lng_range[1], size=1500)
lat_lngs = zip(lats, lngs)

# Identify the nearest city for each lat, lng combination and keep each city
# once. dict.fromkeys de-duplicates in first-seen order with constant-time
# lookups, instead of scanning the growing list for every coordinate pair.
cities = list(
    dict.fromkeys(
        citipy.nearest_city(lat, lng).city_name for lat, lng in lat_lngs
    )
)

# Print the city count to confirm sufficient count
len(cities)

620

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it's being processed (with the city number and city name).


In [3]:
# Use HTTPS so the API key in the query string is not sent in clear text
url = "https://api.openweathermap.org/data/2.5/weather?"
units = "imperial"

# Build partial query URL; the city name is appended to it for each request
query_url = f"{url}appid={weather_api_key}&units={units}&q="

# Log every city together with its position in the list
for index, city_name in enumerate(cities):
    print(index, ": ", city_name)

0 :  hobart
1 :  yeppoon
2 :  jega
3 :  barrow
4 :  te anau
5 :  barentsburg
6 :  illoqqortoormiut
7 :  hithadhoo
8 :  bredasdorp
9 :  ushuaia
10 :  rikitea
11 :  riviere-au-renard
12 :  norman wells
13 :  cockburn town
14 :  albany
15 :  new norfolk
16 :  mattawa
17 :  aklavik
18 :  umm kaddadah
19 :  mataura
20 :  cherskiy
21 :  punta arenas
22 :  atuona
23 :  narsaq
24 :  lebu
25 :  caravelas
26 :  margate
27 :  saskylakh
28 :  dikson
29 :  geraldton
30 :  bestobe
31 :  ribeira grande
32 :  makasar
33 :  bluff
34 :  lompoc
35 :  vaini
36 :  jardim
37 :  castro
38 :  thompson
39 :  ahipara
40 :  acuna
41 :  piacabucu
42 :  sri aman
43 :  avarua
44 :  mys shmidta
45 :  north bend
46 :  cabo san lucas
47 :  georgetown
48 :  meulaboh
49 :  petropavlovsk-kamchatskiy
50 :  los llanos de aridane
51 :  tuktoyaktuk
52 :  saint-philippe
53 :  ostrovnoy
54 :  avera
55 :  aldan
56 :  djibo
57 :  mehamn
58 :  lorengau
59 :  matara
60 :  jalu
61 :  taolanaro
62 :  starozhilovo
63 :  hovd
64 :  ma

In [5]:
# Example query URL (API key redacted; never commit a real key):
# http://api.openweathermap.org/data/2.5/weather?appid=<YOUR_API_KEY>&units=imperial&q=

In [None]:
# Set up lists to hold response info; each list receives one entry per city found
city = []
cloudiness = []
country = []
date = []
humidity = []
lat = []
lng = []
max_temp = []
wind_speed = []

# Seconds to wait for the API before giving up on a single city
request_timeout = 10

# Loop through the list of cities and perform a request for data on each
for city_ in cities:
    try:
        response = requests.get(query_url + city_, timeout=request_timeout).json()
    except (requests.exceptions.RequestException, ValueError) as error:
        # Network failure or a body that is not JSON: skip this city rather
        # than aborting the whole run.
        print(f"{city_} REQUEST FAILED: {error}")
        continue

    try:
        # Read every field before appending anything, so a response that is
        # missing a key cannot leave the lists with different lengths (which
        # would make the later DataFrame construction fail).
        found_name = response['name']
        found_cloudiness = response['clouds']['all']
        found_country = response['sys']['country']
        found_date = response['dt']
        found_humidity = response['main']['humidity']
        found_lat = response['coord']['lat']
        found_lng = response['coord']['lon']
        found_max_temp = response['main']['temp_max']
        found_wind_speed = response['wind']['speed']
    except (KeyError, TypeError):
        # The response does not carry the expected weather fields
        print(f"{city_} NOT FOUND *********")
        continue

    city.append(found_name)
    cloudiness.append(found_cloudiness)
    country.append(found_country)
    date.append(found_date)
    humidity.append(found_humidity)
    lat.append(found_lat)
    lng.append(found_lng)
    max_temp.append(found_max_temp)
    wind_speed.append(found_wind_speed)
    print(f"{city_} FOUND <<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>")

hobart FOUND <<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>
yeppoon FOUND <<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>
jega FOUND <<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>
barrow FOUND <<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>
te anau FOUND <<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>
barentsburg NOT FOUND *********
illoqqortoormiut NOT FOUND *********
hithadhoo FOUND <<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>
bredasdorp FOUND <<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>
ushuaia FOUND <<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>
rikitea FOUND <<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>
riviere-au-renard FOUND <<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<>>>>>>>>>>>>>>>>>>

In [None]:
# Assemble the per-city lists into one table, one row per city found
weather_dict = {
    "City": city,
    "Cloudiness": cloudiness,
    "Country": country,
    "Date": date,
    "Humidity": humidity,
    "Lat": lat,
    "Lng": lng,
    "Max temp": max_temp,
    "Wind Speed": wind_speed,
}
weather_data = pd.DataFrame(weather_dict)

# to_csv does not create missing directories, so make sure the target exists
os.makedirs("./output_data2", exist_ok=True)
weather_data.to_csv("./output_data2/weatherdata2.csv", index_label="CityID")
weather_data

### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

### Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

#### Latitude vs. Temperature Plot

In [None]:

# Date of analysis for the title, taken from the run date instead of a hard-coded string
analysis_date = time.strftime("%m/%d/%y")

fig, ax = plt.subplots()
ax.scatter(weather_data["Lat"], weather_data["Max temp"], marker="h", facecolors="red", edgecolors="black", alpha=0.75)
ax.set_title(f"City Latitude vs Max Temperature ({analysis_date})")
ax.set_xlabel("Latitude")
ax.set_ylabel("Max Temperature (F) ")
# Relative path (same folder as the exported CSV) so the notebook runs on any machine
fig.savefig("./output_data2/Myfig1.png")
plt.show()


#### Latitude vs. Humidity Plot

In [None]:
# Date of analysis for the title, taken from the run date instead of a hard-coded string
analysis_date = time.strftime("%m/%d/%y")

fig, ax = plt.subplots()
ax.scatter(weather_data["Lat"], weather_data["Humidity"], marker="h", facecolors="red", edgecolors="black", alpha=0.75)
ax.set_title(f"City Latitude vs Humidity ({analysis_date})")
ax.set_xlabel("Latitude")
ax.set_ylabel("Humidity (%) ")
# Relative path (same folder as the exported CSV) so the notebook runs on any machine
fig.savefig("./output_data2/Myfig2.png")
plt.show()

#### Latitude vs. Cloudiness Plot

In [None]:
# Date of analysis for the title, taken from the run date instead of a hard-coded string
analysis_date = time.strftime("%m/%d/%y")

fig, ax = plt.subplots()
ax.scatter(weather_data["Lat"], weather_data["Cloudiness"], marker="h", facecolors="red", edgecolors="black", alpha=0.75)
# Label spelling corrected from "Cloudliness" to "Cloudiness"
ax.set_title(f"City Latitude vs Cloudiness ({analysis_date})")
ax.set_xlabel("Latitude")
ax.set_ylabel("Cloudiness (%) ")
# Relative path (same folder as the exported CSV) so the notebook runs on any machine
fig.savefig("./output_data2/Myfig3.png")
plt.show()

#### Latitude vs. Wind Speed Plot

In [None]:
# Date of analysis for the title, taken from the run date instead of a hard-coded string
analysis_date = time.strftime("%m/%d/%y")

fig, ax = plt.subplots()
ax.scatter(weather_data["Lat"], weather_data["Wind Speed"], marker="h", facecolors="red", edgecolors="black", alpha=0.75)
ax.set_title(f"City Latitude vs Wind Speed ({analysis_date})")
ax.set_xlabel("Latitude")
ax.set_ylabel("Wind Speed (mph) ")
# Relative path (same folder as the exported CSV) so the notebook runs on any machine
fig.savefig("./output_data2/Myfig4.png")
plt.show()

## Linear Regression

In [None]:
# OPTIONAL: Create a function to create Linear Regression plots


In [None]:
# Split the cities by hemisphere. A latitude of exactly 0 is assigned to the
# Northern Hemisphere so that a city on the equator is not dropped from both frames.
weather_dataN = weather_data[weather_data.Lat >= 0]
weather_dataS = weather_data[weather_data.Lat < 0]
weather_dataS

In [None]:
# Create Northern and Southern Hemisphere DataFrames


####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

In [None]:
# Northern Hemisphere: linear regression of max temperature on latitude
x_values = weather_dataN["Lat"]
y_values = weather_dataN["Max temp"]
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = f"y = {round(slope, 2)}x + {round(intercept, 2)}"

plt.scatter(x_values, y_values)
plt.plot(x_values, regress_values, "r-")
plt.annotate(line_eq, (6, 10), fontsize=15, color="red")
plt.title("Northern Hemisphere - Max Temp vs. Latitude Linear Regression")
plt.xlabel('Latitude')
plt.ylabel('Max Temp')
# linregress returns the correlation coefficient r; square it to report r-squared
print(f"The r-value is: {rvalue}")
print(f"The r-squared is: {rvalue**2}")
# Relative path (same folder as the exported CSV) so the notebook runs on any machine
plt.savefig("./output_data2/Myfig5.png")
plt.show()

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

In [None]:
# Southern Hemisphere: linear regression of max temperature on latitude
x_values = weather_dataS["Lat"]
y_values = weather_dataS["Max temp"]
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = f"y = {round(slope, 2)}x + {round(intercept, 2)}"

plt.scatter(x_values, y_values)
plt.plot(x_values, regress_values, "r-")
# Southern latitudes are negative, so the previous data-coordinate anchor at
# x=6 fell outside the plotted range. Anchor the equation in axes-fraction
# coordinates instead so it is always inside the plot area.
plt.annotate(line_eq, (0.05, 0.9), xycoords="axes fraction", fontsize=15, color="red")
plt.title("Southern Hemisphere - Max Temp vs. Latitude Linear Regression")
plt.xlabel('Latitude')
plt.ylabel('Max Temp')
# linregress returns the correlation coefficient r; square it to report r-squared
print(f"The r-value is: {rvalue}")
print(f"The r-squared is: {rvalue**2}")
# Relative path (same folder as the exported CSV) so the notebook runs on any machine
plt.savefig("./output_data2/Myfig6.png")
plt.show()

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

In [None]:
# Northern Hemisphere: linear regression of humidity on latitude
x_values = weather_dataN["Lat"]
y_values = weather_dataN["Humidity"]
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = f"y = {round(slope, 2)}x + {round(intercept, 2)}"

plt.scatter(x_values, y_values)
plt.plot(x_values, regress_values, "r-")
plt.annotate(line_eq, (6, 10), fontsize=15, color="red")
plt.title("Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression")
plt.xlabel('Latitude')
plt.ylabel('Humidity')
# linregress returns the correlation coefficient r; square it to report r-squared
print(f"The r-value is: {rvalue}")
print(f"The r-squared is: {rvalue**2}")
# Relative path (same folder as the exported CSV) so the notebook runs on any machine
plt.savefig("./output_data2/Myfig7.png")
plt.show()

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

In [None]:
# Southern Hemisphere: linear regression of humidity on latitude
x_values = weather_dataS["Lat"]
y_values = weather_dataS["Humidity"]
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = f"y = {round(slope, 2)}x + {round(intercept, 2)}"

plt.scatter(x_values, y_values)
plt.plot(x_values, regress_values, "r-")
plt.annotate(line_eq, (-50, 20), fontsize=15, color="red")
plt.title("Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression")
plt.xlabel('Latitude')
plt.ylabel('Humidity')
# linregress returns the correlation coefficient r; square it to report r-squared
print(f"The r-value is: {rvalue}")
print(f"The r-squared is: {rvalue**2}")
# Relative path (same folder as the exported CSV) so the notebook runs on any machine
plt.savefig("./output_data2/Myfig8.png")
plt.show()

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

In [None]:
# Northern Hemisphere: linear regression of cloudiness on latitude
x_values = weather_dataN["Lat"]
y_values = weather_dataN["Cloudiness"]
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = f"y = {round(slope, 2)}x + {round(intercept, 2)}"

plt.scatter(x_values, y_values)
plt.plot(x_values, regress_values, "r-")
plt.annotate(line_eq, (6, 10), fontsize=15, color="red")
plt.title("Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression")
plt.xlabel('Latitude')
plt.ylabel("Cloudiness")
# linregress returns the correlation coefficient r; square it to report r-squared
print(f"The r-value is: {rvalue}")
print(f"The r-squared is: {rvalue**2}")
# Relative path (same folder as the exported CSV) so the notebook runs on any machine
plt.savefig("./output_data2/Myfig9.png")
plt.show()

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

In [None]:
# Southern Hemisphere: linear regression of cloudiness on latitude
x_values = weather_dataS["Lat"]
y_values = weather_dataS["Cloudiness"]
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = f"y = {round(slope, 2)}x + {round(intercept, 2)}"

plt.scatter(x_values, y_values)
plt.plot(x_values, regress_values, "r-")
plt.annotate(line_eq, (-50, 10), fontsize=15, color="red")
plt.title("Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression")
plt.xlabel('Latitude')
plt.ylabel("Cloudiness")
# linregress returns the correlation coefficient r; square it to report r-squared
print(f"The r-value is: {rvalue}")
print(f"The r-squared is: {rvalue**2}")
# Relative path (same folder as the exported CSV) so the notebook runs on any machine
plt.savefig("./output_data2/Myfig10.png")
plt.show()

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

In [None]:
# Northern Hemisphere: linear regression of wind speed on latitude
x_values = weather_dataN["Lat"]
y_values = weather_dataN["Wind Speed"]
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = f"y = {round(slope, 2)}x + {round(intercept, 2)}"

plt.scatter(x_values, y_values)
plt.plot(x_values, regress_values, "r-")
plt.annotate(line_eq, (40, 25), fontsize=15, color="red")
plt.title("Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression")
plt.xlabel('Latitude')
plt.ylabel("Wind Speed")
# linregress returns the correlation coefficient r; square it to report r-squared
print(f"The r-value is: {rvalue}")
print(f"The r-squared is: {rvalue**2}")
# Relative path (same folder as the exported CSV) so the notebook runs on any machine
plt.savefig("./output_data2/Myfig11.png")
plt.show()

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

In [None]:
# Southern Hemisphere: linear regression of wind speed on latitude
x_values = weather_dataS["Lat"]
y_values = weather_dataS["Wind Speed"]
(slope, intercept, rvalue, pvalue, stderr) = linregress(x_values, y_values)
regress_values = x_values * slope + intercept
line_eq = f"y = {round(slope, 2)}x + {round(intercept, 2)}"

plt.scatter(x_values, y_values)
plt.plot(x_values, regress_values, "r-")
plt.annotate(line_eq, (-30, 20), fontsize=15, color="red")
plt.title("Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression")
plt.xlabel('Latitude')
plt.ylabel("Wind Speed")
# linregress returns the correlation coefficient r; square it to report r-squared
print(f"The r-value is: {rvalue}")
print(f"The r-squared is: {rvalue**2}")
# Relative path (same folder as the exported CSV) so the notebook runs on any machine
plt.savefig("./output_data2/Myfig12.png")
plt.show()

In [None]:
Observable Trends

After creating scatter plots and running regression analyses on 558 cities scattered across the globe, using their location, temperature, and other weather parameters, the following trends can be observed with reasonable confidence:

	The max temperature of a city is directly related to its proximity to the equator: the closer a city is to the equator, the higher its max temperature, and vice versa (MyFig1). This is also reflected in the correlation coefficient (r) between Max Temp and Latitude for the Northern Hemisphere, -0.87432, which signifies a very strong inverse relationship between the two variables (MyFig5).

	Looking at cloudiness against the latitude of a location, cloudiness appears to be higher, or more concentrated, over areas with a land mass (continents) than over oceans (MyFig3).


	The plots of wind speed against latitude show that bursts of high wind speed (the outliers) tend to occur at the extreme latitudes, i.e. toward the north and south poles (MyFig4).


