# WeatherPy

---

## Starter Code to Generate Random Geographic Coordinates and a List of Cities

In [1]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
from scipy.stats import linregress

# Import the OpenWeatherMap API key
from api_keys import weather_api_key

# Import citipy to determine the cities based on latitude and longitude
from citipy import citipy

# Output file (CSV)
# NOTE(review): this is an absolute, machine-specific path, and the same output
# directory is hard-coded again in later cells (e.g. the savefig calls). The
# notebook will only run unchanged on a machine with this exact folder layout;
# consider a path relative to the notebook instead -- confirm where the
# notebook lives before changing it.
output_data_file = "C:/Users/emich/Desktop/penn data science bootcamp/Mod6_Assignment/python-api-challenge/output_data/cities.csv"

ModuleNotFoundError: No module named 'api_keys'

### Generate the Cities List by Using the `citipy` Library

In [None]:
# Parallel lists: cities[k] is a unique city name and countries[k] is the
# upper-cased country code reported for that same city.
cities = []
countries = []

# Range of latitudes and longitudes
lat_range = (-90, 90)
lng_range = (-180, 180)

# Create a set of random lat and lng combinations
lats = np.random.uniform(lat_range[0], lat_range[1], size=1500)
lngs = np.random.uniform(lng_range[0], lng_range[1], size=1500)
lat_lngs = zip(lats, lngs)

# Identify nearest city for each lat, lng combination
for lat, lng in lat_lngs:
    # Look the coordinate up once and read both attributes from the same result
    nearest = citipy.nearest_city(lat, lng)
    city = nearest.city_name

    # If the city is unique, then add it (and its country) to our lists
    if city not in cities:
        cities.append(city)
        countries.append(nearest.country_code.upper())

# Print the city count to confirm sufficient count
print(f"Number of cities in the list: {len(cities)}")

# Print the country count to confirm it matches the city count
print(f"Number of countries in the list: {len(countries)}")

---

## Requirement 1: Create Plots to Showcase the Relationship Between Weather Variables and Latitude

### Use the OpenWeatherMap API to retrieve weather data from the cities list generated in the starter code

In [None]:
# Set the API base URL
base_url = "http://api.openweathermap.org/data/2.5/weather?"
# Request imperial units so temperatures are in Fahrenheit and wind speed in mph
unit = "units=imperial"

# Create counters to parse through the data
record_count = 1
set_count = 1

# Define an empty list to hold one weather record (a dict) per retrieved city.
# The keys used below ("Lat", "Max Temp", ...) are the column names that the
# plotting cells read from the resulting DataFrame.
city_data = []

# Print to logger
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Loop through all the cities in our list to fetch weather data
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        # Restart at 1 so every set is logged as records 1..50
        record_count = 1

    # Create endpoint URL with each city (units come first because base_url ends in "?")
    city_url = base_url + unit + "&appid=" + weather_api_key + "&q=" + city

    # Log the record and set numbers -- not the URL, which embeds the API key
    print("Processing Record %s of Set %s | %s" % (record_count, set_count, city))

    # Add 1 to the record count
    record_count += 1

    # Run an API request for each of the cities
    try:
        # A timeout keeps one stalled connection from hanging the whole loop
        response = requests.get(city_url, timeout=10)

        # Anything other than 200 (e.g. 404 for an unknown city) has no weather payload
        if response.status_code != 200:
            print(f"City not found. Skipping {city}... (HTTP {response.status_code})")
            continue

        # Parse the JSON and retrieve data
        city_weather = response.json()

        # Parse out latitude, longitude, max temp, humidity, cloudiness,
        # wind speed, country, and date. The API names longitude "lon".
        city_data.append({"City": city,
                          "Lat": city_weather["coord"]["lat"],
                          "Lng": city_weather["coord"]["lon"],
                          "Max Temp": city_weather["main"]["temp_max"],
                          "Humidity": city_weather["main"]["humidity"],
                          "Cloudiness": city_weather["clouds"]["all"],
                          "Wind Speed": city_weather["wind"]["speed"],
                          "Country": city_weather["sys"]["country"],
                          # "dt" is a Unix timestamp in seconds
                          "Date": pd.to_datetime(city_weather["dt"], unit="s")})

    # If the request fails or the payload is incomplete, skip the city.
    # Only the exception type is printed: requests' error messages can contain
    # the full URL, including the API key.
    except (requests.RequestException, KeyError, ValueError) as err:
        print(f"City not found. Skipping {city}... ({type(err).__name__})")

# Indicate that Data Loading is complete
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

In [None]:
# Convert the cities weather data into a Pandas DataFrame
city_data_df = pd.DataFrame(city_data)

# Export DataFrame as a csv file
city_data_df.to_csv(output_data_file, index_label="City_ID")

# Show Record Count. This is the only value the cell renders: a notebook cell
# displays just its final expression, so the earlier mid-cell previews of
# city_data_df were no-ops and have been removed.
city_data_df.count()

In [None]:
# Preview the first five rows of the retrieved weather data
city_data_df.head(n=5)

In [None]:
# Export the City_Data into a csv. output_data_file (set in the setup cell)
# already holds this exact path, so reuse it instead of repeating the literal.
city_data_df.to_csv(output_data_file, index_label="City_ID")

In [None]:
# Read saved data back from the path configured in the setup cell, so the
# export and the re-import always refer to the same file.
city_data_df = pd.read_csv(output_data_file, index_col="City_ID")

# Display sample data
city_data_df.head()

### Create the Scatter Plots Requested

#### Latitude Vs. Temperature

In [None]:
# Latitude on the x-axis, maximum temperature on the y-axis
x_values = city_data_df["Lat"]
y_values = city_data_df["Max Temp"]

# Draw on the explicitly created Axes rather than the implicit "current" one
fig1, ax1 = plt.subplots(figsize=(11,8))
ax1.scatter(
    x_values,
    y_values,
    edgecolor="black",
    linewidth=1,
    marker="o",
    alpha=0.8,
)
ax1.set_title("City Latitude versus Max Temperature")
ax1.set_xlabel("Latitude")
ax1.set_ylabel("Max Temperature (F)")
ax1.grid()

# Write the figure to disk before showing it
fig1.savefig("C:/Users/emich/Desktop/penn data science bootcamp/Mod6_Assignment/python-api-challenge/output_data/Fig1.png")

# Render the plot
plt.show()

#### Latitude Vs. Humidity

In [None]:
# Latitude on the x-axis, humidity on the y-axis
x_values = city_data_df["Lat"]
y_values = city_data_df["Humidity"]

# Draw on the explicitly created Axes rather than the implicit "current" one
fig1, ax1 = plt.subplots(figsize=(11, 8))
ax1.scatter(
    x_values,
    y_values,
    edgecolor="black",
    linewidth=1,
    marker="o",
    alpha=0.8,
)
ax1.set_xlabel("Latitude")
ax1.set_ylabel("Humidity (%)")
ax1.set_title("City Latitude versus Humidity")
ax1.grid()

# Write the figure to disk before showing it
fig1.savefig("C:/Users/emich/Desktop/penn data science bootcamp/Mod6_Assignment/python-api-challenge/output_data/Fig2.png")

# Render the plot
plt.show()

#### Latitude Vs. Cloudiness

In [None]:
# Build the scatter plot for latitude vs. cloudiness
x_values = city_data_df["Lat"]
y_values = city_data_df["Cloudiness"]

# Incorporate the other graph properties on the explicitly created Axes.
# The former stand-alone `markersize=12` statement was never passed to the
# scatter call, so it had no effect on the figure and has been dropped.
fig1, ax1 = plt.subplots(figsize=(10, 8))
ax1.scatter(x_values, y_values, edgecolor="black", linewidth=1, marker="o", alpha=0.8)
ax1.set_xlabel("Latitude")
ax1.set_ylabel("Cloudiness (%)")
ax1.set_title("City Latitude vs. Cloudiness")
ax1.grid()

# Save the figure
fig1.savefig("C:/Users/emich/Desktop/penn data science bootcamp/Mod6_Assignment/python-api-challenge/output_data/Fig3.png")

# Show plot
plt.show()

#### Latitude vs. Wind Speed Plot

In [None]:
# Latitude on the x-axis, wind speed on the y-axis
x_values = city_data_df["Lat"]
y_values = city_data_df["Wind Speed"]

# Draw on the explicitly created Axes rather than the implicit "current" one
fig1, ax1 = plt.subplots(figsize=(10,8))
ax1.scatter(
    x_values,
    y_values,
    edgecolor="black",
    linewidth=1,
    marker="o",
    alpha=0.8,
)
ax1.set_xlabel("Latitude")
ax1.set_ylabel("Wind Speed (MPH)")
ax1.set_title("City Latitude versus Wind Speed")
ax1.grid()

# Write the figure to disk before showing it
fig1.savefig("C:/Users/emich/Desktop/penn data science bootcamp/Mod6_Assignment/python-api-challenge/output_data/Fig4.png")

# Render the plot
plt.show()

---

## Requirement 2: Compute Linear Regression for Each Relationship


In [None]:
# Define a function to create Linear Regression plots
def regression_line(x_values, y_values, y_title, x_title="Latitude", ax=None):
    """Scatter-plot ``y_values`` against ``x_values`` and overlay the least-squares line.

    Parameters
    ----------
    x_values, y_values : array-like of numbers
        Paired observations of equal length (pandas Series work).
    y_title : str
        Label for the y-axis; also used in the plot title.
    x_title : str, optional
        Label for the x-axis (default ``"Latitude"``).
    ax : matplotlib Axes, optional
        Axes to draw on. When omitted, a new figure and Axes are created.

    Returns
    -------
    The object returned by ``scipy.stats.linregress`` for the two inputs;
    this function reads its ``slope``, ``intercept`` and ``rvalue``.

    Raises
    ------
    Whatever ``linregress`` raises for inputs it cannot fit is propagated
    unchanged.
    """
    x = np.asarray(x_values, dtype=float)
    y = np.asarray(y_values, dtype=float)

    fit = linregress(x, y)

    # A straight line is fully determined by its two end points: y = slope * x + intercept
    line_x = np.array([x.min(), x.max()])
    line_y = fit.slope * line_x + fit.intercept
    line_eq = f"y = {fit.slope:.2f}x + {fit.intercept:.2f}"

    if ax is None:
        _, ax = plt.subplots(figsize=(10, 8))

    ax.scatter(x, y, edgecolor="black", linewidth=1, marker="o", alpha=0.8)
    ax.plot(line_x, line_y, color="red")
    # Axes-fraction coordinates keep the equation inside the frame for any data range
    ax.annotate(line_eq, xy=(0.05, 0.92), xycoords="axes fraction", fontsize=15, color="red")
    ax.set_xlabel(x_title)
    ax.set_ylabel(y_title)
    ax.set_title(f"{y_title} vs. {x_title}")
    ax.grid()

    print(f"The r-value is: {fit.rvalue}")
    return fit

In [None]:
# Create a DataFrame with the Northern Hemisphere data (Latitude >= 0)
northern_hemi_df = city_data_df.loc[city_data_df["Lat"] >= 0]

x_axis = northern_hemi_df["Lat"]
y_axis = northern_hemi_df["Max Temp"]
# The retrieval cell asks the API for imperial units and the scatter plot of
# this same column is labelled (F), so the label here is Fahrenheit as well.
y_title = "Max Temperature (F)"

# NOTE(review): regression_line is expected to come from the
# "Define a function to create Linear Regression plots" cell -- confirm it is
# defined before this cell runs.
regression_line(x_axis, y_axis, y_title)

# Display sample data
northern_hemi_df.head()

In [None]:
# Create a DataFrame with the Southern Hemisphere data (Latitude < 0)
southern_hemi_df = city_data_df.loc[city_data_df["Lat"] < 0]

# Display sample data
southern_hemi_df.head()

###  Temperature vs. Latitude Linear Regression Plot

In [None]:
# Linear regression on Northern Hemisphere
# NOTE(review): this cell only echoes `x_axis`; no regression is computed or
# plotted here. `x_axis` is assigned in the Northern Hemisphere DataFrame cell
# above, which is also where regression_line(...) is called.
x_axis

In [None]:
# Linear regression on Southern Hemisphere
# YOUR CODE HERE

**Discussion about the linear relationship:** YOUR RESPONSE HERE

### Humidity vs. Latitude Linear Regression Plot

In [None]:
# Northern Hemisphere
# YOUR CODE HERE

In [None]:
# Southern Hemisphere
# YOUR CODE HERE

**Discussion about the linear relationship:** YOUR RESPONSE HERE

### Cloudiness vs. Latitude Linear Regression Plot

In [None]:
# Northern Hemisphere
# YOUR CODE HERE

In [None]:
# Southern Hemisphere
# YOUR CODE HERE

**Discussion about the linear relationship:** YOUR RESPONSE HERE

### Wind Speed vs. Latitude Linear Regression Plot

In [None]:
# Northern Hemisphere
# YOUR CODE HERE

In [None]:
# Southern Hemisphere
# YOUR CODE HERE

**Discussion about the linear relationship:** YOUR RESPONSE HERE