# WeatherPy
----

### Analysis
* As expected, the weather becomes significantly warmer as one approaches the equator (0 Deg. Latitude). More interestingly, however, is the fact that the southern hemisphere tends to be warmer this time of year than the northern hemisphere. This may be due to the tilt of the earth.
* There is no strong relationship between latitude and cloudiness. However, it is interesting to see that a strong band of cities sits at 0, 80, and 100% cloudiness.
* There is no strong relationship between latitude and wind speed. However, in northern hemispheres there is a flurry of cities with over 20 mph of wind.

---

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [4]:
! pip install citipy



In [2]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
from scipy.stats import linregress
from pprint import pprint

# Import API key
from api_key import api_key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Output File (CSV)
output_data_file = "output_data/cities.csv"

# Range of latitudes and longitudes
lat_range = (-90, 90)
lng_range = (-180, 180)

## Generate Cities List

In [8]:
# List for holding lat_lngs and cities
lat_lngs = []
cities = []

# Create a set of random lat and lng combinations
lats = np.random.uniform(low=-90.000, high=90.000, size=1500)
lngs = np.random.uniform(low=-180.000, high=180.000, size=1500)
lat_lngs = zip(lats, lngs)

# Identify nearest city for each lat, lng combination
for lat_lng in lat_lngs:
    city = citipy.nearest_city(lat_lng[0], lat_lng[1]).city_name
    
    # If the city is unique, then add it to a our cities list
    if city not in cities:
        cities.append(city)

# Print the city count to confirm sufficient count
print(len(cities))

602


In [19]:
### Perform API Calls
#Perform a weather check on each city using a series of successive API calls.

#Perform a quick test by coming up with a list of cities with successive API calls
city_test = ['Toronto', 'Paris', 'Zagreb', 'Hoian', 'Windsor', 'Unionville', 'Mississauga', 'Hanoi', 'San Francisco']

#Find url to extract api from owm website
base_url = f"http://api.openweathermap.org/data/2.5/weather?&appid={api_key}&q="

#Create Empty List and set value at city count
city_test_list = []
city_number=1

#Include a print log of each city as it'sbeing processed (with the city number and city name).
for i in city_test:
    city_url = base_url + i
    response_test= requests.get(city_url).json()

    try:
        city_test_list.append(response_test['name'])
        print(f"Processing record {city_number} of|{i}")
        city_number +=1
        
    except:
        # Append null values
        print(f"City not found.  Skipping..")
        pass

    

City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..


In [10]:
# Create empty lists for dataframe to plot data
cityname = []
temperature_max = []
cloudiness =[]
humidity=[]
windspeed=[]
latitude=[]
longitude=[]
date=[]
country = []

print("Beginning Data Retrieval")
print("-----------------------------")

# Set value for record and set count
record = 1
set_number = 1

# Loop through the cities in the full cities list to get all the required weather information through API calls.
# Also, to get a print log of all the cities found from calling the API.


for city in cities:
    weather_url = base_url + city
    response= requests.get(weather_url + "&units=imperial").json()

    try:
        cloudiness.append(response['clouds']['all'])
        country.append(response['sys']['country'])
        date.append(response['dt'])
        humidity.append(response['main']['humidity'])
        latitude.append(response['coord']['lat'])
        longitude.append(response['coord']['lon'])
        temperature_max.append(response['main']['temp_max'])
        windspeed.append(response['wind']['speed'])
        print(f"Processing record {record} of set {set_number}|{city}")
        
        # record and set count
        if record > 49:
            record = 1
            set_number += 1
            cityname.append(city)
        else:
            record += 1
            cityname.append(city)
    except:
        # Append null values
        print(f"City not found.  Skipping..")
        pass
print("-----------------------------")
print("Data Retrieval Complete") 
print("-----------------------------")

Beginning Data Retrieval
-----------------------------
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skip

City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Ski

City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
City not found.  Skipping..
-----------------------------
Data Retrieval Complete
-----------------------------


In [None]:
### Convert Raw Data to DataFrame
# Display the DataFrame
weather_data = pd.DataFrame({
    'City': cityname,
    'Cloudiness': cloudiness,
    'Country': country,
    'Date': date,
    'Humidity': humidity,
    'Latitude': latitude,
    'Longitude': longitude,
    'Max Temperature': temperature_max,
    'Windspeed': windspeed
    
})
weather_data

In [None]:
#count the number of records by columns
weather_data.count()

In [None]:
# Export the city data into a .csv.
weather_data.to_csv("Output Files/weather_data.csv")

### Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

#### Latitude vs. Temperature Plot

In [None]:
# Generate a scatter plot of average tumor volume vs. mouse weight for the Capomulin regimen
plt.scatter(weather_data.iloc[:,5], weather_data.iloc[:,7], marker="o", facecolors="blue", edgecolors="black")

# Formatting the scatter diagram with title, x & y labels, and x & y limits
plt.title ("City Latitude vs Maximum Temperature")
plt.xlabel("Latitude")
plt.ylabel("Max Temperature (F)")
plt.grid()

# Output of scatter plot
plt.show()

# Save scatter plot as png file to output folder
plt.savefig("OutputFiles/Latitude_MaxTemp")

#Calculate r-value
slope, intercept, rvalue, pvalue, stderr = linregress(weather_data.iloc[:,5], weather_data.iloc[:,7])  
rvalue

#### Latitude vs. Humidity Plot

In [None]:
# Generate a scatter plot of average tumor volume vs. mouse weight for the Capomulin regimen
plt.scatter(weather_data.iloc[:,5], weather_data.iloc[:,4], marker="o", facecolors="blue", edgecolors="black")

# Formatting the scatter diagram with title, x & y labels, and x & y limits
plt.title ("City Latitude vs Humidity")
plt.xlabel("Latitude")
plt.ylabel("Humidity (%)")
plt.grid()

# Output of scatter plot
plt.show()

# Save scatter plot as PNG in Output files directory


slope, intercept, rvalue, pvalue, stderr = linregress(weather_data.iloc[:,5], weather_data.iloc[:,4])  
rvalue

#### Latitude vs. Cloudiness Plot

In [None]:
# Generate a scatter plot of average tumor volume vs. mouse weight for the Capomulin regimen
plt.scatter(weather_data.iloc[:,5], weather_data.iloc[:,1], marker="o", facecolors="blue", edgecolors="black")

# Formatting the scatter diagram with title, x & y labels, and x & y limits
plt.title ("City Latitude vs Cloudiness")
plt.xlabel("Latitude")
plt.ylabel("Cloudiness (%)")
plt.grid()

# Output of scatter plot
plt.show()

slope, intercept, rvalue, pvalue, stderr = linregress(weather_data.iloc[:,5], weather_data.iloc[:,1])  
rvalue

#### Latitude vs. Wind Speed Plot

In [None]:
# Generate a scatter plot of average tumor volume vs. mouse weight for the Capomulin regimen
plt.scatter(weather_data.iloc[:,5], weather_data.iloc[:,8], marker="o", facecolors="blue", edgecolors="black")

# Formatting the scatter diagram with title, x & y labels, and x & y limits
plt.title ("City Latitude vs Wind Speed")
plt.xlabel("Latitude")
plt.ylabel("Wind Speed (mph)")
plt.grid()

# Output of scatter plot
plt.show()

slope, intercept, rvalue, pvalue, stderr = linregress(weather_data.iloc[:,5], weather_data.iloc[:,8])  
rvalue