# WeatherPy

---

## Starter Code to Generate Random Geographic Coordinates and a List of Cities

In [1]:
%matplotlib inline
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
import scipy.stats as st
from scipy.stats import linregress
import json

# Impor the OpenWeatherMap API key
from api_keys import weather_api_key

# Import citipy to determine the cities based on latitude and longitude
from citipy import citipy



### Generate the Cities List by Using the `citipy` Library

In [2]:
# Empty list for holding the latitude and longitude combinations
lat_lngs = []

# Empty list for holding the cities names
cities = []

# Range of latitudes and longitudes
lat_range = (-90, 90)
lng_range = (-180, 180)

# Create a set of random lat and lng combinations
lats = np.random.uniform(lat_range[0], lat_range[1], size=1500)
lngs = np.random.uniform(lng_range[0], lng_range[1], size=1500)
lat_lngs = zip(lats, lngs)

# Identify nearest city for each lat, lng combination
for lat_lng in lat_lngs:
    city = citipy.nearest_city(lat_lng[0], lat_lng[1]).city_name
    
    # If the city is unique, then add it to a our cities list
    if city not in cities:
        cities.append(city)

# Print the city count to confirm sufficient count
print(f"Number of cities in the list: {len(cities)}")

Number of cities in the list: 573


In [3]:
cities

['adamstown',
 'yalta',
 'nuuk',
 'wailua homesteads',
 'edinburgh of the seven seas',
 'puerto natales',
 'hami',
 'thompson',
 'papatowai',
 'kindu',
 'olonkinbyen',
 'blackmans bay',
 'cruzeiro do sul',
 'bethel',
 'yellowknife',
 'newman',
 'alotau',
 'gadzhiyevo',
 'iwon-up',
 'portland',
 'namdrik',
 'lewistown',
 'talnakh',
 'keflavik',
 'ribeira grande',
 'whitehorse',
 'talara',
 'cabo san lucas',
 'lihue',
 'longyearbyen',
 'utrik',
 'slave lake',
 'port alfred',
 'hawaiian paradise park',
 'crane',
 'susuman',
 'vadso',
 'ushuaia',
 'grytviken',
 'minas de marcona',
 'iqaluit',
 'petropavlovsk-kamchatsky',
 'port-aux-francais',
 'alice springs',
 'waingapu',
 'kodiak',
 'skutskar',
 'kailua-kona',
 'sandakan',
 'waitangi',
 'daoukro',
 'jayapura',
 'tongouson',
 'guerrero negro',
 'rio preto da eva',
 'margaret river',
 'valle de la pascua',
 'axim',
 'port elizabeth',
 'zuni pueblo',
 'fonte boa',
 'zeya',
 'selfoss',
 'tateyama',
 'mata de sao joao',
 'taiohae',
 'dudinka'

---

## Requirement 1: Create Plots to Showcase the Relationship Between Weather Variables and Latitude

### Use the OpenWeatherMap API to retrieve weather data from the cities list generated in the started code

In [None]:
# Set the API base URL
url = 'https://api.openweathermap.org/data/2.5/weather?'

# Define an empty list to fetch the weather data for each city
city_data = []

# Print to logger
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters
record_count = 1
set_count = 1

# Loop through all the cities in our list to fetch weather data
for i, city in enumerate(cities):
        
    # Group cities in sets of 50 for logging purposes
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 0

    # Create endpoint URL with each city
    city_url = f"{url}q={city}&units=metric&appid={weather_api_key}"
    
    # Log the url, record, and set numbers
    print("Processing Record %s of Set %s | %s" % (record_count, set_count, city))


     # Add 1 to the record count
    record_count += 1

    # Run an API request for each of the cities
    try:
    # Parse the JSON and retrieve data
        city_weather = requests.get(city_url).json()


        # Parse out latitude, longitude, max temp, humidity, cloudiness, wind speed, country, and date
        city_lat = city_weather['coord']['lat']
        city_lng = city_weather['coord']['lon']
        city_max_temp = city_weather['main']['temp_max']
        city_humidity = city_weather['main']['humidity']
        city_clouds = city_weather['clouds']['all']
        city_wind = city_weather['wind']['speed']
        city_country = city_weather['sys']['country']
        city_date = city_weather['dt']

        # Append the City information into city_data list
        city_data.append({"City": city, 
                          "Lat": city_lat, 
                          "Lng": city_lng, 
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date
                         })

   # If an error is experienced, skip the city
    except:
        print("City not found. Skipping...")
        pass
              
# Indicate that Data Loading is complete 
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | adamstown
Processing Record 2 of Set 1 | yalta
Processing Record 3 of Set 1 | nuuk
Processing Record 4 of Set 1 | wailua homesteads
Processing Record 5 of Set 1 | edinburgh of the seven seas
Processing Record 6 of Set 1 | puerto natales
Processing Record 7 of Set 1 | hami
Processing Record 8 of Set 1 | thompson
Processing Record 9 of Set 1 | papatowai
Processing Record 10 of Set 1 | kindu
Processing Record 11 of Set 1 | olonkinbyen
Processing Record 12 of Set 1 | blackmans bay
Processing Record 13 of Set 1 | cruzeiro do sul
Processing Record 14 of Set 1 | bethel
Processing Record 15 of Set 1 | yellowknife
Processing Record 16 of Set 1 | newman
Processing Record 17 of Set 1 | alotau
City not found. Skipping...
Processing Record 18 of Set 1 | gadzhiyevo
Processing Record 19 of Set 1 | iwon-up
Processing Record 20 of Set 1 | portland
Processing Record 21 of Set 1 | namdrik
Processing Record 22 of Se

Processing Record 39 of Set 4 | gaspe
Processing Record 40 of Set 4 | hermanus
Processing Record 41 of Set 4 | cannonvale
Processing Record 42 of Set 4 | regina
Processing Record 43 of Set 4 | mikun'
Processing Record 44 of Set 4 | ad dilam
Processing Record 45 of Set 4 | la passe
Processing Record 46 of Set 4 | egilsstadir
Processing Record 47 of Set 4 | sitka
Processing Record 48 of Set 4 | trinity beach
Processing Record 49 of Set 4 | likiep
Processing Record 0 of Set 5 | ancud
Processing Record 1 of Set 5 | cascais
Processing Record 2 of Set 5 | rongelap
Processing Record 3 of Set 5 | pospelikha
Processing Record 4 of Set 5 | yangshuo
Processing Record 5 of Set 5 | woolgoolga
Processing Record 6 of Set 5 | kangding
Processing Record 7 of Set 5 | margate
Processing Record 8 of Set 5 | boende
Processing Record 9 of Set 5 | buala
Processing Record 10 of Set 5 | port lincoln
Processing Record 11 of Set 5 | bardai
Processing Record 12 of Set 5 | ahau
City not found. Skipping...
Processi

Processing Record 33 of Set 8 | malabar
Processing Record 34 of Set 8 | mata-utu
Processing Record 35 of Set 8 | tanrake village
City not found. Skipping...
Processing Record 36 of Set 8 | labrador city
Processing Record 37 of Set 8 | mwatate
Processing Record 38 of Set 8 | mili
Processing Record 39 of Set 8 | areia
Processing Record 40 of Set 8 | mogadishu
Processing Record 41 of Set 8 | yanbu
Processing Record 42 of Set 8 | vila franca do campo
Processing Record 43 of Set 8 | lorengau
Processing Record 44 of Set 8 | san luis de la loma
Processing Record 45 of Set 8 | labuan
Processing Record 46 of Set 8 | lodwar
Processing Record 47 of Set 8 | west fargo
Processing Record 48 of Set 8 | nema
Processing Record 49 of Set 8 | coquimbo
Processing Record 0 of Set 9 | kutum
Processing Record 1 of Set 9 | san rafael del yuma
Processing Record 2 of Set 9 | tranovaho
City not found. Skipping...
Processing Record 3 of Set 9 | matoury
Processing Record 4 of Set 9 | sisimiut
Processing Record 5 o

In [None]:
# Convert the cities weather data into a Pandas DataFrame
city_data_df = pd.DataFrame(city_data)

# Show Record Count
city_data_df.count()



In [None]:
# Display sample data
city_data_df.head()



In [None]:
import os

# Create the output_data directory if it doesn't exist
output_data_dir = 'output_data'
os.makedirs(output_data_dir, exist_ok=True)

# Save the CSV file in the output_data directory
csv_path = os.path.join(output_data_dir, 'cities.csv')
city_data_df.to_csv(csv_path, index_label="City_ID")


# Export the City_Data into a csv
city_data_df.to_csv("output_data/cities.csv", index_label="City_ID")



In [None]:
# Read saved data
city_data_df = pd.read_csv("output_data/cities.csv", index_col="City_ID")

# Display sample data
city_data_df.head()




### Create the Scatter Plots Requested

#### Latitude Vs. Temperature

In [None]:
# Build scatter plot for latitude vs. temperature
plt.scatter(city_data_df['Lat'],city_data_df['Max Temp'], marker='o', edgecolor='black')

# Incorporate the other graph properties
plt.xlabel('Latitude')
plt.ylabel('Max Temperature(C)')
plt.title('City Latitude vs.Temperature')
plt.grid()

# Save the figure
plt.savefig("output_data/Fig1.png")

# Show plot
plt.show()



#### Latitude Vs. Humidity

In [None]:
# Build the scatter plots for latitude vs. humidity
plt.scatter(city_data_df['Lat'],city_data_df['Humidity'], marker='o', edgecolor='black')

# Incorporate the other graph properties
plt.xlabel('Latitude')
plt.ylabel('Humidity(%)')
plt.title('City Latitude vs. Humidity')
plt.grid()

# Save the figure
plt.savefig("output_data/Fig2.png")

# Show plot
plt.show()



#### Latitude Vs. Cloudiness

In [None]:
# Build the scatter plots for latitude vs. cloudiness
plt.scatter(city_data_df['Lat'],city_data_df['Cloudiness'], marker='o', edgecolor='black')

# Incorporate the other graph properties
plt.xlabel('Latitude')
plt.ylabel('Cloudiness(%)')
plt.title('City Latitude vs.Cloudiness')
plt.grid()

# Save the figure
plt.savefig("output_data/Fig3.png")

# Show plot
plt.show()



#### Latitude vs. Wind Speed Plot

In [None]:
# Build the scatter plots for latitude vs. wind speed
plt.scatter(city_data_df['Lat'],city_data_df['Wind Speed'], marker='o', edgecolor='black')

# Incorporate the other graph properties
plt.xlabel('Latitude')
plt.ylabel('Wind Speed(m/s)')
plt.title('City Latitude vs.Wind Speed')
plt.grid()

# Save the figure
plt.savefig("output_data/Fig4.png")

# Show plot
plt.show()



---

## Requirement 2: Compute Linear Regression for Each Relationship


In [None]:
# Define a function to create Linear Regression plots
def linear_reg(x_axis, y_axis,eq_loc):  
    correlation = st.pearsonr(x_axis,y_axis)
    p_slope, p_int, p_r, p_p, p_std_err = st.linregress(x_axis, y_axis)
    p_fit = p_slope * x_axis + p_int
    eq= f"y ={p_slope: .2f}x +{ p_int: .2f}"
       
    #Plot the line
    plt.scatter(x_axis, y_axis ,marker="o")
    plt.plot(x_axis,p_fit,"--", color='red')
    plt.annotate(eq, eq_loc, fontsize=12, color='red')
    print(f"The r-value between {x_axis.name} and {y_axis.name} is {round(correlation[0],2)}")



In [None]:
# Create a DataFrame with the Northern Hemisphere data (Latitude >= 0)
northern_hemi_df = city_data_df.loc[city_data_df['Lat']>=0]

# Display sample data
northern_hemi_df.head()



In [None]:
# Create a DataFrame with the Southern Hemisphere data (Latitude < 0)
southern_hemi_df = city_data_df.loc[city_data_df['Lat']<0]

# Display sample data
southern_hemi_df.head()



###  Temperature vs. Latitude Linear Regression Plot

In [None]:
# Linear regression on Northern Hemisphere
linear_reg(northern_hemi_df['Lat'], northern_hemi_df['Max Temp'], (10, -10))
plt.xlabel('Latitude')
plt.ylabel('Temperature(C)')



In [None]:
# Linear regression on Southern Hemisphere
linear_reg(southern_hemi_df['Lat'], southern_hemi_df['Max Temp'], (-30, 5))
plt.xlabel('Latitude')
plt.ylabel('Temperature(C)')


**Discussion about the linear relationship:** The northern and southern hemispheres are opposite of one another. Meaning that in the northern hemisphere - the higher the altitude the colder the weather, while the southern hemisphere is the opposite of that. 

### Humidity vs. Latitude Linear Regression Plot

In [None]:
# Northern Hemisphere
# Northern Hemisphere
linear_reg(northern_hemi_df['Lat'], northern_hemi_df['Humidity'],(55, 10))
plt.xlabel('Latitude')
plt.ylabel('Humidity(%)')



In [None]:
# Southern Hemisphere
# Southern Hemisphere
linear_reg(southern_hemi_df['Lat'], southern_hemi_df['Humidity'],(-50, 25))
plt.xlabel('Latitude')
plt.ylabel('Humidity(%)')



**Discussion about the linear relationship:** Both northern and southern hemispheres have a weak correlation with latitude and humidity

### Cloudiness vs. Latitude Linear Regression Plot

In [None]:
# Northern Hemisphere
linear_reg(northern_hemi_df['Lat'], northern_hemi_df['Cloudiness'],(50, 50))
plt.xlabel('Latitude')
plt.ylabel('Cloudiness(%)')


In [None]:
# Southern Hemisphere
linear_reg(southern_hemi_df['Lat'], southern_hemi_df['Cloudiness'],(-50, 65))
plt.xlabel('Latitude')
plt.ylabel('Cloudiness(%)')


**Discussion about the linear relationship:** 

### Wind Speed vs. Latitude Linear Regression Plot

In [None]:
# Northern Hemisphere
linear_reg(northern_hemi_df['Lat'], northern_hemi_df['Wind Speed'],(10, 12))
plt.xlabel('Latitude')
plt.ylabel('Wind Speed(m/s)')


In [None]:
# Southern Hemisphere
linear_reg(southern_hemi_df['Lat'], southern_hemi_df['Wind Speed'],(-50, 9))
plt.xlabel('Latitude')
plt.ylabel('Wind Speed(m/s)')


**Discussion about the linear relationship:** YOUR RESPONSE HERE