In [1]:
# Import the dependencies
import pandas as pd
import requests
import numpy as np
from citipy import citipy


# Import the API keys
from config import weather_api_key

In [2]:
# Base endpoint for OpenWeatherMap's current-weather API, requesting imperial units.
# HTTPS is used so the API key carried in the query string is not sent in clear text.
url = "https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

In [3]:
# Draw 100 random latitudes, then 100 random longitudes, each uniformly
# distributed over its full valid range.
lats = np.random.uniform(-90.000, 90.000, size=100)
lngs = np.random.uniform(-180.000, 180.000, size=100)

# Pair them up lazily; the bare name below displays the resulting zip object.
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x1c635faf788>

In [4]:
# Materialise the latitude/longitude pairs as a list.
# The pairs are zipped from `lats` and `lngs` directly instead of consuming the
# one-shot `lat_lngs` iterator, so re-running this cell yields the same list
# rather than an empty one.
coordinates = list(zip(lats, lngs))

In [5]:
# Identify the nearest city for each lat/long pair, keeping each city only once.
# dict.fromkeys() drops duplicates while preserving first-seen order, and its
# hash-based lookup avoids rescanning a growing list for every coordinate.
cities = list(dict.fromkeys(
    citipy.nearest_city(lat, lng).city_name for lat, lng in coordinates
))

# Show the city count to confirm sufficient count
len(cities)

87

# Pseudocode
1. Create 1st retrieval -> capture latitude and longitude, maximum temperature, percent humidity, percent cloudiness, wind speed, and weather description
    - create DataFrame1 from the new list, making sure the city name is included (it is the join key)
2. Create 2nd retrieval -> if the same coordinates have rain, fetch the rain amount; otherwise add zero
    - create DataFrame2 from the new list, making sure the city name is included
3. Create 3rd retrieval -> if the same coordinates have snow, fetch the snow amount; otherwise add zero
    - create DataFrame3 from the new list, making sure the city name is included
4. Join all three DataFrames on city
    a. Join DataFrame1 and DataFrame2 as DataFrameX
    b. Join DataFrameX and DataFrame3 as DataFrame
5. Write the file as CSV, then answer the question using Pandas methods: How many cities have recorded rainfall or snow?

In [6]:
# Start the first retrieval with a fresh, empty list of weather records
city_data1 = list()

# Announce the start of the run (banner line followed by a separator line)
print(" .xX-> RETRIEVAL OF DATA1 HAS COMMENCED <-Xx. ",
      "---------------------------------------------",
      sep="\n")

# Both logging counters start at one
record_count = set_count = 1

 .xX-> RETRIEVAL OF DATA1 HAS COMMENCED <-Xx. 
---------------------------------------------


In [7]:
# Loop through all the cities in our list and collect one weather record per
# city for which the API returns the expected fields.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1

    # Create endpoint URL with each city
    city_url = url + "&q=" + city.replace(" ","+")

    # Log the record and set numbers and the city.
    # The URL itself is deliberately not logged: it embeds the API key.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")

    # Add 1 to the record count
    record_count += 1

    # Run an API request for each of the cities.
    try:
        # Parse the JSON and retrieve data. The timeout keeps one stalled
        # connection from hanging the whole run.
        city_weather = requests.get(city_url, timeout=10).json()

        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        city_description = city_weather["weather"][0]["description"]

        # Append the city information into city_data1 list
        city_data1.append({"City": city.title(),
                           "Country": city_country,
                           "Lat": city_lat,
                           "Lng": city_lng,
                           "Max Temp": city_max_temp,
                           "Humidity": city_humidity,
                           "Cloudiness": city_clouds,
                           "Wind Speed": city_wind,
                           "Current Description": city_description
                          })

    except (KeyError, IndexError, TypeError):
        # The payload lacks the expected fields (presumably an error response
        # for a city the API does not know); skip the city.
        print("No city we found, move on we must...")

    except (requests.exceptions.RequestException, ValueError) as err:
        # Network failure or a body that is not valid JSON; skip the city.
        # Only the exception type is printed because the exception message can
        # contain the request URL, which includes the API key.
        print(f"Request failed ({type(err).__name__}), move on we must...")

# Indicate that Data Loading is complete
print("---------------------------------------------")
print(" .xX-> RETRIEVAL OF DATA1 HAS COMPLETED <-Xx. ")
print("---------------------------------------------")

Processing Record 1 of Set 1 | inhambane
Processing Record 2 of Set 1 | karpathos
Processing Record 3 of Set 1 | busselton
Processing Record 4 of Set 1 | ambilobe
Processing Record 5 of Set 1 | port-gentil
Processing Record 6 of Set 1 | ushuaia
Processing Record 7 of Set 1 | tuktoyaktuk
Processing Record 8 of Set 1 | esperance
Processing Record 9 of Set 1 | port macquarie
Processing Record 10 of Set 1 | sola
Processing Record 11 of Set 1 | hofn
Processing Record 12 of Set 1 | lata
Processing Record 13 of Set 1 | airai
Processing Record 14 of Set 1 | aklavik
Processing Record 15 of Set 1 | yellowknife
Processing Record 16 of Set 1 | ivanishchi
Processing Record 17 of Set 1 | reykjavik
Processing Record 18 of Set 1 | atuona
Processing Record 19 of Set 1 | nouadhibou
Processing Record 20 of Set 1 | mataura
Processing Record 21 of Set 1 | lorengau
Processing Record 22 of Set 1 | fortuna
Processing Record 23 of Set 1 | balgazyn
Processing Record 24 of Set 1 | kahului
Processing Record 25 of

In [8]:
# Display how many records city_data1 holds, to confirm the count is sufficient
len(city_data1)

77

In [9]:
# Destination path of the first retrieval's CSV export
output_data_file1 = "weather_database/DataFrame1.csv"

# Build a DataFrame from the collected list of record dictionaries
city_data1_df = pd.DataFrame(city_data1)

# Write the DataFrame to disk, labelling the index column "City_ID"
city_data1_df.to_csv(output_data_file1, index_label="City_ID")

In [10]:
# Start the second retrieval with a fresh, empty list of rain records
city_data2 = list()

# Announce the start of the run (banner line followed by a separator line)
print(" .xX-> RETRIEVAL OF DATA2 HAS COMMENCED <-Xx. ",
      "---------------------------------------------",
      sep="\n")

# Both logging counters start at one
record_count = set_count = 1

 .xX-> RETRIEVAL OF DATA2 HAS COMMENCED <-Xx. 
---------------------------------------------


In [11]:
# Loop through all the cities in our list and record a rain value for each one
# (0 when the response carries no rain data).
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1

    # Create endpoint URL with each city
    city_url = url + "&q=" + city.replace(" ","+")

    # Log the record and set numbers and the city.
    # The URL itself is deliberately not logged: it embeds the API key.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")

    # Add 1 to the record count
    record_count += 1

    # Request the city's weather exactly once; the same response is inspected
    # for both the 3h and the 1h rain fields.
    try:
        city_weather = requests.get(city_url, timeout=10).json()
    except (requests.exceptions.RequestException, ValueError) as err:
        # Network failure or a body that is not valid JSON: fall through to
        # the "no rain data" case. Only the exception type is printed because
        # the exception message can contain the URL, which includes the API key.
        print(f"Request failed ({type(err).__name__}), recording 0 rain")
        city_weather = {}

    # Pull out the "rain" object, tolerating payloads that have none.
    rain = city_weather.get("rain") if isinstance(city_weather, dict) else None
    if not isinstance(rain, dict):
        rain = {}

    # Prefer the 3h volume, fall back to the 1h volume, otherwise record 0.
    city_rain = rain.get("3h", rain.get("1h", 0))

    # NOTE(review): OpenWeatherMap documents rain volume in millimetres
    # regardless of `units`; the "Rain (Inches)" label is kept unchanged for
    # downstream compatibility -- TODO confirm and convert or rename.
    # Append the rain information into city_data2 list
    city_data2.append({"City": city.title(),
                       "Rain (Inches)": city_rain
                       })

# Indicate that Data Loading is complete
print("---------------------------------------------")
print(" .xX-> RETRIEVAL OF DATA2 HAS COMPLETED <-Xx. ")
print("---------------------------------------------")

Processing Record 1 of Set 1 | inhambane
Processing Record 2 of Set 1 | karpathos
Processing Record 3 of Set 1 | busselton
Processing Record 4 of Set 1 | ambilobe
Processing Record 5 of Set 1 | port-gentil
Processing Record 6 of Set 1 | ushuaia
Processing Record 7 of Set 1 | tuktoyaktuk
Processing Record 8 of Set 1 | esperance
Processing Record 9 of Set 1 | port macquarie
Processing Record 10 of Set 1 | sola
Processing Record 11 of Set 1 | hofn
Processing Record 12 of Set 1 | lata
Processing Record 13 of Set 1 | airai
Processing Record 14 of Set 1 | aklavik
Processing Record 15 of Set 1 | yellowknife
Processing Record 16 of Set 1 | ivanishchi
Processing Record 17 of Set 1 | reykjavik
Processing Record 18 of Set 1 | atuona
Processing Record 19 of Set 1 | nouadhibou
Processing Record 20 of Set 1 | mataura
Processing Record 21 of Set 1 | lorengau
Processing Record 22 of Set 1 | fortuna
Processing Record 23 of Set 1 | balgazyn
Processing Record 24 of Set 1 | kahului
Processing Record 25 of

In [12]:
# Display how many records city_data2 holds, to confirm the count is sufficient
len(city_data2)

87

In [13]:
# Destination path of the second retrieval's CSV export
output_data_file2 = "weather_database/DataFrame2.csv"

# Build a DataFrame from the collected list of rain record dictionaries
city_data2_df = pd.DataFrame(city_data2)

# Write the DataFrame to disk, labelling the index column "City_ID"
city_data2_df.to_csv(output_data_file2, index_label="City_ID")

In [14]:
# Start the third retrieval with a fresh, empty list of snow records
city_data3 = list()

# Announce the start of the run (banner line followed by a separator line)
print(" .xX-> RETRIEVAL OF DATA3 HAS COMMENCED <-Xx. ",
      "---------------------------------------------",
      sep="\n")

# Both logging counters start at one
record_count = set_count = 1

 .xX-> RETRIEVAL OF DATA3 HAS COMMENCED <-Xx. 
---------------------------------------------


In [15]:
# Loop through all the cities in our list and record a snow value for each one
# (0 when the response carries no snow data).
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1

    # Create endpoint URL with each city
    city_url = url + "&q=" + city.replace(" ","+")

    # Log the record and set numbers and the city.
    # The URL itself is deliberately not logged: it embeds the API key.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")

    # Add 1 to the record count
    record_count += 1

    # Request the city's weather exactly once; the same response is inspected
    # for both the 3h and the 1h snow fields.
    try:
        city_weather = requests.get(city_url, timeout=10).json()
    except (requests.exceptions.RequestException, ValueError) as err:
        # Network failure or a body that is not valid JSON: fall through to
        # the "no snow data" case. Only the exception type is printed because
        # the exception message can contain the URL, which includes the API key.
        print(f"Request failed ({type(err).__name__}), recording 0 snow")
        city_weather = {}

    # Pull out the "snow" object, tolerating payloads that have none.
    snow = city_weather.get("snow") if isinstance(city_weather, dict) else None
    if not isinstance(snow, dict):
        snow = {}

    # Prefer the 3h volume, fall back to the 1h volume, otherwise record 0.
    city_snow = snow.get("3h", snow.get("1h", 0))

    # NOTE(review): OpenWeatherMap documents snow volume in millimetres
    # regardless of `units`; the "Snow (Inches)" label is kept unchanged for
    # downstream compatibility -- TODO confirm and convert or rename.
    # Append the snow information into city_data3 list
    city_data3.append({"City": city.title(),
                       "Snow (Inches)": city_snow
                       })

# Indicate that Data Loading is complete
print("---------------------------------------------")
print(" .xX-> RETRIEVAL OF DATA3 HAS COMPLETED <-Xx. ")
print("---------------------------------------------")

Processing Record 1 of Set 1 | inhambane
Processing Record 2 of Set 1 | karpathos
Processing Record 3 of Set 1 | busselton
Processing Record 4 of Set 1 | ambilobe
Processing Record 5 of Set 1 | port-gentil
Processing Record 6 of Set 1 | ushuaia
Processing Record 7 of Set 1 | tuktoyaktuk
Processing Record 8 of Set 1 | esperance
Processing Record 9 of Set 1 | port macquarie
Processing Record 10 of Set 1 | sola
Processing Record 11 of Set 1 | hofn
Processing Record 12 of Set 1 | lata
Processing Record 13 of Set 1 | airai
Processing Record 14 of Set 1 | aklavik
Processing Record 15 of Set 1 | yellowknife
Processing Record 16 of Set 1 | ivanishchi
Processing Record 17 of Set 1 | reykjavik
Processing Record 18 of Set 1 | atuona
Processing Record 19 of Set 1 | nouadhibou
Processing Record 20 of Set 1 | mataura
Processing Record 21 of Set 1 | lorengau
Processing Record 22 of Set 1 | fortuna
Processing Record 23 of Set 1 | balgazyn
Processing Record 24 of Set 1 | kahului
Processing Record 25 of

In [16]:
# Display how many records city_data3 holds, to confirm the count is sufficient
len(city_data3)

87

In [17]:
# Destination path of the third retrieval's CSV export
output_data_file3 = "weather_database/DataFrame3.csv"

# Build a DataFrame from the collected list of snow record dictionaries
city_data3_df = pd.DataFrame(city_data3)

# Write the DataFrame to disk, labelling the index column "City_ID"
city_data3_df.to_csv(output_data_file3, index_label="City_ID")