In [1]:
# Import dependencies
import os

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd

In [2]:
# Deliverable 1.3
# Draw 2,000 random latitudes from [-90, 90) and 2,000 random longitudes
# from [-180, 180), then pair them up position by position.
# Note: zip() returns a one-shot iterator, so lat_lngs can be consumed once.
lats = np.random.uniform(-90.000, 90.000, 2000)
lngs = np.random.uniform(-180.000, 180.000, 2000)
lat_lngs = zip(lats, lngs)

In [3]:
# Add the latitudes and longitudes to a list of (lat, lng) tuples.
# The list is built directly from the arrays instead of from the one-shot
# `lat_lngs` iterator: a zip object is exhausted after a single pass, so
# re-running this cell would otherwise silently produce an empty list.
coordinates = list(zip(lats, lngs))

In [4]:
from citipy import citipy

In [5]:
# Deliverable 1.4
# Identify the nearest city for each lat/lng combination and keep every city
# name exactly once, in first-seen order.
# dict.fromkeys() de-duplicates with hashed lookups, which avoids scanning a
# growing list with `in` on every iteration.
cities = list(dict.fromkeys(
    citipy.nearest_city(lat, lng).city_name for lat, lng in coordinates
))

# Print the city count to confirm sufficient count
len(cities)

757

In [6]:
# Deliverable 1.5
# Import the API key
from config import weather_api_key

# Import the requests library
import requests

# Starting URL for Weather Map API call (imperial units).
# HTTPS is used because the API key is part of the query string and would
# otherwise travel over the network in clear text.
url = "https://api.openweathermap.org/data/2.5/weather?units=IMPERIAL&APPID=" + weather_api_key

# Import the time library and the datetime module from the datetime library
import time
from datetime import datetime

In [7]:
# Deliverable 1.6
# Query the weather API once per city and collect one record (a dict) per
# city that returns a complete response.

# Create an empty list to hold the weather data.
city_data = []

# Print the beginning of the logging.
print("Beginning Data Retrieval.    ")
print("-----------------------------")

# Create counters
record_count = 1
set_count = 1

# Loop through all the cities in our list.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes and pause 60 seconds
    # between sets (presumably to stay under the API's rate limit).
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
        time.sleep(60)

    # Log the record and set numbers and the city.
    print(f'Processing Record {record_count} of Set {set_count} | {city}')

    # Add 1 to the record count.
    record_count += 1

    # Run an API request for each of the cities.
    try:
        # Pass the city via `params` so requests URL-encodes it fully (not
        # only spaces), and set a timeout so one stalled connection cannot
        # hang the whole run.
        city_weather = requests.get(url, params={'q': city}, timeout=10).json()
        # Parse out the needed data
        city_lat = city_weather['coord']['lat']
        city_lng = city_weather['coord']['lon']
        city_max_temp = city_weather['main']['temp_max']
        city_humidity = city_weather['main']['humidity']
        city_clouds = city_weather['clouds']['all']
        city_wind = city_weather['wind']['speed']
        city_desc = str(city_weather['weather'][0]['description'])
        city_country = city_weather['sys']['country']
        # Convert the Unix timestamp to a UTC date string. time.gmtime() gives
        # the same result as datetime.utcfromtimestamp(), which is deprecated
        # in recent Python versions.
        city_date = time.strftime('%Y-%m-%d %H:%M:%S', time.gmtime(city_weather['dt']))
        # Append the city information into the city_data list
        city_data.append({'City': city.title(),
                          'Lat': city_lat,
                          'Lng': city_lng,
                          'Max Temp': city_max_temp,
                          'Humidity': city_humidity,
                          'Cloudiness': city_clouds,
                          'Wind Speed': city_wind,
                          'Weather Description': city_desc,
                          'Country': city_country,
                          'Date': city_date})

    # If the request fails or the response lacks an expected field, skip the
    # city. Only these error types are caught, so KeyboardInterrupt still
    # stops the loop when the user interrupts the kernel.
    except (requests.exceptions.RequestException,
            KeyError, IndexError, TypeError, ValueError):
        print('City not found. Skipping...')

# Indicate that Data Loading is complete.
print('-----------------------------')
print('Data Retrieval Complete      ')
print('-----------------------------')
    



Beginning Data Retrieval.    
-----------------------------
Processing Record 1 of Set 1 | ushuaia
Processing Record 2 of Set 1 | punta arenas
Processing Record 3 of Set 1 | avarua
Processing Record 4 of Set 1 | hobart
Processing Record 5 of Set 1 | lasa
Processing Record 6 of Set 1 | aljezur
Processing Record 7 of Set 1 | albany
Processing Record 8 of Set 1 | carnarvon
Processing Record 9 of Set 1 | te anau
Processing Record 10 of Set 1 | tsihombe
City not found. Skipping...
Processing Record 11 of Set 1 | saint-philippe
Processing Record 12 of Set 1 | puerto ayora
Processing Record 13 of Set 1 | georgetown
Processing Record 14 of Set 1 | mbaiki
Processing Record 15 of Set 1 | foam lake
Processing Record 16 of Set 1 | arraial do cabo
Processing Record 17 of Set 1 | upernavik
Processing Record 18 of Set 1 | barrow
Processing Record 19 of Set 1 | rikitea
Processing Record 20 of Set 1 | cape town
Processing Record 21 of Set 1 | vaini
Processing Record 22 of Set 1 | yanchukan
City not fou

In [8]:
# Count the weather records collected in city_data (one dict per city).
len(city_data)

696

In [9]:
# Build a DataFrame from the list of per-city weather dictionaries (one row
# per dictionary), then preview the first ten rows.
city_data_df = pd.DataFrame(data=city_data)
city_data_df.head(n=10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Weather Description,Country,Date
0,Ushuaia,-54.8,-68.3,49.66,46,20,21.85,few clouds,AR,2022-05-07 21:59:35
1,Punta Arenas,-53.15,-70.9167,48.31,71,20,23.02,few clouds,CL,2022-05-07 21:59:36
2,Avarua,-21.2078,-159.775,80.53,74,100,5.3,overcast clouds,CK,2022-05-07 21:59:36
3,Hobart,-42.8794,147.3294,53.46,82,75,12.66,broken clouds,AU,2022-05-07 21:58:07
4,Lasa,46.6166,10.7002,50.36,95,100,2.75,overcast clouds,IT,2022-05-07 21:59:37
5,Aljezur,37.3191,-8.8033,59.4,81,14,6.55,few clouds,PT,2022-05-07 21:59:38
6,Albany,42.6001,-73.9662,58.46,33,100,9.62,overcast clouds,US,2022-05-07 21:59:38
7,Carnarvon,-24.8667,113.6333,62.67,82,75,5.75,broken clouds,AU,2022-05-07 21:56:19
8,Te Anau,-45.4167,167.7167,57.0,96,100,2.24,overcast clouds,NZ,2022-05-07 21:59:39
9,Saint-Philippe,-21.3585,55.7679,72.99,83,33,10.87,light rain,RE,2022-05-07 21:53:11


In [10]:
# Reorder the columns: identifying fields first, then the coordinates,
# then the weather measurements and description.
new_column_order = [
    'City', 'Country', 'Date',
    'Lat', 'Lng',
    'Max Temp', 'Humidity', 'Cloudiness', 'Wind Speed',
    'Weather Description',
]
city_data_df = city_data_df.loc[:, new_column_order]
city_data_df.head()

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Weather Description
0,Ushuaia,AR,2022-05-07 21:59:35,-54.8,-68.3,49.66,46,20,21.85,few clouds
1,Punta Arenas,CL,2022-05-07 21:59:36,-53.15,-70.9167,48.31,71,20,23.02,few clouds
2,Avarua,CK,2022-05-07 21:59:36,-21.2078,-159.775,80.53,74,100,5.3,overcast clouds
3,Hobart,AU,2022-05-07 21:58:07,-42.8794,147.3294,53.46,82,75,12.66,broken clouds
4,Lasa,IT,2022-05-07 21:59:37,46.6166,10.7002,50.36,95,100,2.75,overcast clouds


In [11]:
# Create the output file (CSV).
output_data_file = 'Weather_Database/cities.csv'

# Make sure the target folder exists first: to_csv() does not create missing
# directories, and failing here would waste the long retrieval run.
os.makedirs(os.path.dirname(output_data_file), exist_ok=True)

# Export city_data into CSV, labelling the index column "City_ID".
city_data_df.to_csv(output_data_file, index_label="City_ID")