In [1]:
# Import the dependencies.
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np

In [2]:
#Add the code that generates the latitudes and longitudes, but first, they need to be stored so that we can access them later. 
#Since we are creating arrays of latitudes and longitudes, we'll declare each array as a variable.

In [3]:
# Create a set of random latitude and longitude combinations.
lats = np.random.uniform(low=-90.000, high=90.000, size=1500)
lngs = np.random.uniform(low=-180.000, high=180.000, size=1500)
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x7fa54d22d960>

In [4]:
# Add the latitudes and longitudes to a list.
coordinates = list(lat_lngs)

In [5]:
# Use the citipy module to determine city based on latitude and longitude.
from citipy import citipy

In [6]:
# Create a list for holding the cities.
cities = []
# Identify the nearest city for each latitude and longitude combination.
for coordinate in coordinates:
    city = citipy.nearest_city(coordinate[0], coordinate[1]).city_name

    # If the city is unique, then we will add it to the cities list.
    if city not in cities:
        cities.append(city)
# Print the city count to confirm sufficient count.
len(cities)

628

In [7]:
#Some of this code should look familiar, but let's break it down:
#We create a cities list to store city names.
#We iterate through the coordinates, as in our practice, 
#and retrieve the nearest city using the latitude and longitude pair.
#We add a decision statement with the logical operator not in to determine 
#whether the found city is already in the cities list. If not, then we'll use the append() function to add it. 
#We are doing this because among the 1,500 latitudes and longitudes, there might be duplicates, 
#which will retrieve duplicate cities, and we want to be sure we capture only the unique cities.

In [8]:
#Now that we know how to get all the weather data from a JSON response, 
#we can iterate through our cities list and retrieve the data from each city.

#We will need to do the following:

#Import our dependencies and initialize counters and an empty list that will hold the weather data.
#Loop through the cities list.
#Group the cities in sets of 50 to log the process as we find the weather data for each city.
#Two counters will be needed here: one to log the city count from 1 to 50, and another for the sets.
#Build the city_url or endpoint for each city.
#Log the URL and the record and set numbers.
#Make an API request for each city.
#Parse the JSON weather data for the following:
#City, country, and date
#Latitude and longitude
#Maximum temperature
#Humidity
#Cloudiness
#Wind speed
#Add the data to a list in a dictionary format and then convert the list to a DataFrame.


In [9]:
city_data = []

In [10]:
# Import the requests library.
import requests

# Import the API key.
from config import weather_api_key

# Import the time library and the datetime module from the datetime library 
import time
from datetime import datetime

In [11]:
# Create an empty list to hold the weather data.
city_data = []
# Print the beginning of the logging.
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters.
record_count = 1
set_count = 1

#In the code block, we have initialized the counters at 1 because we want the first iteration of the logging 
#for each recorded response and the set to start at 1.

Beginning Data Retrieval     
-----------------------------


In [12]:
#Next, we need to iterate through our list of cities and begin building the URL for each city, 
#while grouping our records in sets of 50. To do this, use for i in range(len(cities)) 
#and the index to tell us when we get to 50.

# Loop through all the cities in our list.
#Every time we want to reference the city in our code, we need to use the indexing on the cities list. 
#Unfortunately, this will cause programming errors when we are building the city_url 
#because it adds the index, not the city name, to the city_url. To fix this issue, 
#we need to create another for loop to get the city from the cities list.
#------------------------------------------------------------------------------
url = "http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" 

for i, city in enumerate(cities):
    # Group cities in sets of 50 for logging purposes.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
#Once we get to 50, we tell the program to pause for 60 seconds using the time.sleep(60) command. 
#The OpenWeatherMap API only allows 60 calls for per minute on their free tier, 
#so pausing our program for one minute after each set of 50 will prevent time-out errors. 
        time.sleep(60)
#We can also retrieve the city from the cities list and add it to the city_url by using indexing,    
    city_url = url + "&q=" + cities[i]
    # Log the URL, record, and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count.
    record_count += 1

Processing Record 1 of Set 1 | bhaderwah
Processing Record 2 of Set 1 | maholi
Processing Record 3 of Set 1 | ushuaia
Processing Record 4 of Set 1 | tasiilaq
Processing Record 5 of Set 1 | taolanaro
Processing Record 6 of Set 1 | bethel
Processing Record 7 of Set 1 | busselton
Processing Record 8 of Set 1 | meulaboh
Processing Record 9 of Set 1 | chokurdakh
Processing Record 10 of Set 1 | nizhneyansk
Processing Record 11 of Set 1 | san cristobal
Processing Record 12 of Set 1 | vaini
Processing Record 13 of Set 1 | punta arenas
Processing Record 14 of Set 1 | east london
Processing Record 15 of Set 1 | cabo san lucas
Processing Record 16 of Set 1 | nara
Processing Record 17 of Set 1 | new norfolk
Processing Record 18 of Set 1 | harper
Processing Record 19 of Set 1 | georgetown
Processing Record 20 of Set 1 | rikitea
Processing Record 21 of Set 1 | ballina
Processing Record 22 of Set 1 | yellowknife
Processing Record 23 of Set 1 | bambous virieux
Processing Record 24 of Set 1 | mataura
P

Processing Record 1 of Set 5 | karratha
Processing Record 2 of Set 5 | turkan
Processing Record 3 of Set 5 | sao jose da coroa grande
Processing Record 4 of Set 5 | cayenne
Processing Record 5 of Set 5 | mitsamiouli
Processing Record 6 of Set 5 | sigayevo
Processing Record 7 of Set 5 | nagua
Processing Record 8 of Set 5 | bonthe
Processing Record 9 of Set 5 | qaanaaq
Processing Record 10 of Set 5 | simplicio mendes
Processing Record 11 of Set 5 | guerrero negro
Processing Record 12 of Set 5 | tomatlan
Processing Record 13 of Set 5 | coffs harbour
Processing Record 14 of Set 5 | kavaratti
Processing Record 15 of Set 5 | antofagasta
Processing Record 16 of Set 5 | constitucion
Processing Record 17 of Set 5 | amderma
Processing Record 18 of Set 5 | okhotsk
Processing Record 19 of Set 5 | hun
Processing Record 20 of Set 5 | saskylakh
Processing Record 21 of Set 5 | longyearbyen
Processing Record 22 of Set 5 | samusu
Processing Record 23 of Set 5 | kawana waters
Processing Record 24 of Set 

Processing Record 1 of Set 9 | burica
Processing Record 2 of Set 9 | west plains
Processing Record 3 of Set 9 | nouadhibou
Processing Record 4 of Set 9 | flinders
Processing Record 5 of Set 9 | chulym
Processing Record 6 of Set 9 | cedar city
Processing Record 7 of Set 9 | sahawar
Processing Record 8 of Set 9 | teahupoo
Processing Record 9 of Set 9 | touros
Processing Record 10 of Set 9 | champerico
Processing Record 11 of Set 9 | chhabra
Processing Record 12 of Set 9 | ostrovnoy
Processing Record 13 of Set 9 | helena
Processing Record 14 of Set 9 | ilulissat
Processing Record 15 of Set 9 | lago da pedra
Processing Record 16 of Set 9 | sosva
Processing Record 17 of Set 9 | goderich
Processing Record 18 of Set 9 | masuguru
Processing Record 19 of Set 9 | kodinsk
Processing Record 20 of Set 9 | dolny kubin
Processing Record 21 of Set 9 | lorengau
Processing Record 22 of Set 9 | coppell
Processing Record 23 of Set 9 | skelleftea
Processing Record 24 of Set 9 | altus
Processing Record 25 o

Processing Record 1 of Set 13 | tetiyiv
Processing Record 2 of Set 13 | ust-uda
Processing Record 3 of Set 13 | ambulu
Processing Record 4 of Set 13 | alanya
Processing Record 5 of Set 13 | toliary
Processing Record 6 of Set 13 | wanning
Processing Record 7 of Set 13 | sobolevo
Processing Record 8 of Set 13 | mbandaka
Processing Record 9 of Set 13 | greenville
Processing Record 10 of Set 13 | omboue
Processing Record 11 of Set 13 | zverinogolovskoye
Processing Record 12 of Set 13 | kawalu
Processing Record 13 of Set 13 | karasburg
Processing Record 14 of Set 13 | poltavka
Processing Record 15 of Set 13 | pavelets
Processing Record 16 of Set 13 | wattegama
Processing Record 17 of Set 13 | moulins
Processing Record 18 of Set 13 | missoula
Processing Record 19 of Set 13 | panguma
Processing Record 20 of Set 13 | qurunbaliyah
Processing Record 21 of Set 13 | maumere
Processing Record 22 of Set 13 | coolum beach
Processing Record 23 of Set 13 | cottbus
Processing Record 24 of Set 13 | north

In [13]:
# Run an API request for each of the cities.Module 6.2.6
try:
        # Parse the JSON and retrieve data.
    city_weather = requests.get(city_url).json()
        # Parse out the needed data.
    city_lat = city_weather["coord"]["lat"]
    city_lng = city_weather["coord"]["lon"]
    city_max_temp = city_weather["main"]["temp_max"]
    city_humidity = city_weather["main"]["humidity"]
    city_clouds = city_weather["clouds"]["all"]
    city_wind = city_weather["wind"]["speed"]
    city_country = city_weather["sys"]["country"]
        # Convert the date to ISO standard.
    city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
        # Append the city information into city_data list.
    city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})

# If an error is experienced, skip the city.
except:
    print("City not found. Skipping...")
    pass

# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

City not found. Skipping...
-----------------------------
Data Retrieval Complete      
-----------------------------


In [14]:
#6.2.7 Creating a dataframe of City weather

In [16]:
#Recall that we can convert a list of dictionaries to a Pandas DataFrame using 
#df = pd.DataFrame(list with dictionaries).
import pandas as pd

# Convert the array of dictionaries to a Pandas DataFrame.
city_data_df = pd.DataFrame(city_data)
city_data_df.head(10)
#Dataframe in 6.3.1 is not showing up

In [None]:
#Recall that to reorder the columns, we assign a variable to an array of the columns in the order 
#we want them to appear:

new_column_order = ["City", "Country", "Date", "Lat", "Lng", "Max Temp", "Humidity", "Cloudiness", "Wind Speed"]

#Then, we assign a new or the same DataFrame with new column order:

city_data_df = city_data_df[new_column_order]
city_data_df

In [None]:
#The last line in the code block will export the DataFrame to a CSV file, with the index label (or column A) 
#header as "City_ID." If we ever need to export the CSV file to a DataFrame, that header will be present in the DataFrame.

# Create the output file (CSV).
output_data_file = "weather_data/cities.csv"
# Export the City_Data into a CSV.
city_data_df.to_csv(output_data_file, index_label="City_ID")

#We've completed our tasks for making API calls, parsing the response, and collecting the data for our project

In [None]:
#gitignor in module 6.2.7

In [None]:
#Getting Data for Plotting

# Extract relevant fields from the DataFrame for plotting.
lats = city_data_df["Lat"]
max_temps = city_data_df["Max Temp"]
humidity = city_data_df["Humidity"]
cloudiness = city_data_df["Cloudiness"]
wind_speed = city_data_df["Wind Speed"]

In [None]:
# Import time module
import time

# Build the scatter plot for latitude vs. max temperature.
plt.scatter(lats,
            max_temps,
            edgecolor="black", linewidths=1, marker="o",
            alpha=0.8, label="Cities")

# Incorporate the other graph properties.
plt.title(f"City Latitude vs. Max Temperature "+ time.strftime("%x"))
plt.ylabel("Max Temperature (F)")
plt.xlabel("Latitude")
plt.grid(True)

# Save the figure.
plt.savefig("weather_data/Fig1.png")

# Show plot.
plt.show()

In [None]:
#the code to create a scatter plot for latitude versus humidity. 
plt.scatter(lats, humidity, edgecolor="black", linewidths=1, marker="o", alpha=0.8, label="Cities")

# Incorporate the other graph properties.
plt.title(f"City Latitude vs. Humidity "+ time.strftime("%x"))
plt.ylabel("Humidity (%)")
plt.xlabel("Latitude")
plt.grid(True)

# Save the figure.
plt.savefig("weather_data/Fig2.png")

# Show plot.
plt.show()

In [None]:
#refactor the code for our scatter plots by changing the y-axis variable to "cloudiness," 
#the title to "Cloudiness (%)," and the y-axis label to "Cloudiness (%)."

In [None]:
# Build the scatter plots for latitude vs. cloudiness.
plt.scatter(lats,
            cloudiness,
            edgecolor="black", linewidths=1, marker="o",
            alpha=0.8, label="Cities")

# Incorporate the other graph properties.
plt.title(f"City Latitude vs. Cloudiness (%) "+ time.strftime("%x"))
plt.ylabel("Cloudiness (%)")
plt.xlabel("Latitude")
plt.grid(True)
# Save the figure.
plt.savefig("weather_data/Fig3.png")
# Show plot.
plt.show()

In [None]:
#Let's repurpose the code we have been using and change the y-axis variable to "wind speed," 
#the title to "Wind Speed," and the y-axis label to "Wind Speed (mph)."

In [None]:
# Build the scatter plots for latitude vs. wind speed.
plt.scatter(lats,
            wind_speed,
            edgecolor="black", linewidths=1, marker="o",
            alpha=0.8, label="Cities")

# Incorporate the other graph properties.
plt.title(f"City Latitude vs. Wind Speed "+ time.strftime("%x"))
plt.ylabel("Wind Speed (mph)")
plt.xlabel("Latitude")
plt.grid(True)
# Save the figure.
plt.savefig("weather_data/Fig4.png")
# Show plot.
plt.show()

In [None]:
# Create a function to create perform linear regression on the weather data
# and plot a regression line and the equation with the data.
def plot_linear_regression(x_values, y_values, title, y_label, text_coordinates):
