In [1]:
# import dependencies
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np
from citipy import citipy


In [2]:
# create a set of random latitude and longitude combinations
lats = np.random.uniform(low=-90.000, high=90.000, size=1500)
lngs = np.random.uniform(low=-180.000, high=180.000, size=1500)
lat_lngs = zip(lats, lngs)

In [3]:
# add the latitudes and logitudes to a list
coordinates = list(lat_lngs)

In [4]:
# Create a list for holding the cities
cities=[]
# Identify the nearest city for each latitude and longitude combination
for coordinate in coordinates:
    city = citipy.nearest_city(coordinate[0], coordinate[1]).city_name
    
    # If the city is unique, then we will add it to the cities list
    if city not in cities:
        cities.append(city)
# print the city count to confirm sufficient count.
len(cities)

597

In [5]:
# import the requests library
import requests

# import the API key
from config import weather_api_key

In [6]:
# Starting URL for weather map API call
url = "http://api.openweathermap.org/data/2.5/weather?unites=Imperial&APPID=" + weather_api_key
print(url)

http://api.openweathermap.org/data/2.5/weather?unites=Imperial&APPID=0132a1a5560f78db4653dca3b1034416


In [7]:
# Create an endpoint URL for a city
city_url = url + "&q=" + "Boston"
city_weather = requests.get(city_url)
city_weather.json()

{'coord': {'lon': -71.0598, 'lat': 42.3584},
 'weather': [{'id': 803,
   'main': 'Clouds',
   'description': 'broken clouds',
   'icon': '04d'}],
 'base': 'stations',
 'main': {'temp': 277.08,
  'feels_like': 273.68,
  'temp_min': 275.45,
  'temp_max': 278.68,
  'pressure': 1008,
  'humidity': 56},
 'visibility': 10000,
 'wind': {'speed': 4.02, 'deg': 311, 'gust': 8.49},
 'clouds': {'all': 75},
 'dt': 1638211511,
 'sys': {'type': 2,
  'id': 2013408,
  'country': 'US',
  'sunrise': 1638186725,
  'sunset': 1638220417},
 'timezone': -18000,
 'id': 4930956,
 'name': 'Boston',
 'cod': 200}

In [8]:
# Get the JSON data.
boston_data = city_weather.json()

In [9]:
boston_data['sys']['country']

'US'

In [10]:
boston_data['dt']

1638211511

In [11]:
lat = boston_data['coord']['lat']
lon = boston_data['coord']['lon']
max_temp = boston_data['main']['temp_max']
min_temp = boston_data['main']['temp_min']
humidity = boston_data['main']['humidity']
clouds = boston_data['clouds']['all']
wind = boston_data['wind']['speed']
print(lat, lon, max_temp, min_temp, humidity, clouds, wind)

42.3584 -71.0598 278.68 275.45 56 75 4.02


In [12]:
# Import the time library and the datetime module from the datetime library
import time
from datetime import datetime

In [13]:
# Initialize counters and an empty list that will hold the weather data.
city_data = []
# Print the beginning of the logging.
print("Beginning Data Retrieval    ")
print("----------------------------")

Beginning Data Retrieval    
----------------------------


In [14]:
# Create counters
record_count = 1
set_count = 1

In [15]:
# Loop through the cities list.
for i, city in enumerate(cities):
    
    # Group cities in sets of 50 for logging purposes.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
        time.sleep(60)
        
    # Create endpoint url with each city.
    city_url = url + "&q=" + city.replace(" ", "+")
    
    # Log the URL, record, and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count.
    record_count += 1
# Run an API request for each of the cities:
    try:
        # Parse the JSON and retrieve data.
        city_weather = requests.get(city_url).json()
        # Parse Out the needed data.
        city_lat = city_weather['coord']['lat']
        city_lng = city_weather['coord']['lon']
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        # Convert the date to ISO standard.
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y, %m, %d %H:%M:%S')
        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
                         "Lat": city_lat,
                         "Lng": city_lng,
                         "Max Temp": city_max_temp,
                         "Humidity": city_humidity,
                         "Cloudiness": city_clouds,
                         "Wind Speed": city_wind,
                         "Country": city_country,
                         "Date": city_date})
# If an error is experienced, skip the city
    except:
        print("City not found. Skipping...")
        pass
    
# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Processing Record 1 of Set 1 | carnarvon
Processing Record 2 of Set 1 | acapulco
Processing Record 3 of Set 1 | barrow
Processing Record 4 of Set 1 | taolanaro
City not found. Skipping...
Processing Record 5 of Set 1 | vaini
Processing Record 6 of Set 1 | bethel
Processing Record 7 of Set 1 | esperance
Processing Record 8 of Set 1 | mana
Processing Record 9 of Set 1 | bluff
Processing Record 10 of Set 1 | upernavik
Processing Record 11 of Set 1 | pevek
Processing Record 12 of Set 1 | rikitea
Processing Record 13 of Set 1 | airai
Processing Record 14 of Set 1 | port elizabeth
Processing Record 15 of Set 1 | busselton
Processing Record 16 of Set 1 | namibe
Processing Record 17 of Set 1 | phangnga
Processing Record 18 of Set 1 | cape town
Processing Record 19 of Set 1 | saskylakh
Processing Record 20 of Set 1 | kapaa
Processing Record 21 of Set 1 | zhigansk
Processing Record 22 of Set 1 | xining
Processing Record 23 of Set 1 | mount gambier
Processing Record 24 of Set 1 | ushuaia
Processi

Processing Record 38 of Set 4 | haines junction
Processing Record 39 of Set 4 | batticaloa
Processing Record 40 of Set 4 | guerrero negro
Processing Record 41 of Set 4 | grand gaube
Processing Record 42 of Set 4 | mahibadhoo
Processing Record 43 of Set 4 | kazalinsk
City not found. Skipping...
Processing Record 44 of Set 4 | castro
Processing Record 45 of Set 4 | dudinka
Processing Record 46 of Set 4 | fallon
Processing Record 47 of Set 4 | barbar
City not found. Skipping...
Processing Record 48 of Set 4 | cedar city
Processing Record 49 of Set 4 | axim
Processing Record 50 of Set 4 | simnas
Processing Record 1 of Set 5 | tabou
Processing Record 2 of Set 5 | kijang
Processing Record 3 of Set 5 | riyadh
Processing Record 4 of Set 5 | turukhansk
Processing Record 5 of Set 5 | ponta delgada
Processing Record 6 of Set 5 | samarai
Processing Record 7 of Set 5 | sai buri
Processing Record 8 of Set 5 | troy
Processing Record 9 of Set 5 | weston
Processing Record 10 of Set 5 | udachnyy
Process

Processing Record 29 of Set 8 | port hedland
Processing Record 30 of Set 8 | svetlyy
Processing Record 31 of Set 8 | rodrigues alves
Processing Record 32 of Set 8 | penticton
Processing Record 33 of Set 8 | yulara
Processing Record 34 of Set 8 | alirajpur
Processing Record 35 of Set 8 | awbari
Processing Record 36 of Set 8 | curup
Processing Record 37 of Set 8 | yerbogachen
Processing Record 38 of Set 8 | agbor
Processing Record 39 of Set 8 | rungata
City not found. Skipping...
Processing Record 40 of Set 8 | balabac
Processing Record 41 of Set 8 | mayo
Processing Record 42 of Set 8 | bauchi
Processing Record 43 of Set 8 | robinson
Processing Record 44 of Set 8 | svetlogorsk
Processing Record 45 of Set 8 | pedernales
Processing Record 46 of Set 8 | ilulissat
Processing Record 47 of Set 8 | hudiksvall
Processing Record 48 of Set 8 | perth
Processing Record 49 of Set 8 | toamasina
Processing Record 50 of Set 8 | beckley
Processing Record 1 of Set 9 | carthage
Processing Record 2 of Set 9

Processing Record 18 of Set 12 | kolokani
Processing Record 19 of Set 12 | maracaju
Processing Record 20 of Set 12 | lentekhi
Processing Record 21 of Set 12 | manado
Processing Record 22 of Set 12 | leningradskiy
Processing Record 23 of Set 12 | kisangani
Processing Record 24 of Set 12 | filingue
Processing Record 25 of Set 12 | port-gentil
Processing Record 26 of Set 12 | urusha
Processing Record 27 of Set 12 | rio gallegos
Processing Record 28 of Set 12 | ust-nera
Processing Record 29 of Set 12 | santa maria do para
Processing Record 30 of Set 12 | jalu
Processing Record 31 of Set 12 | basco
Processing Record 32 of Set 12 | mangrol
Processing Record 33 of Set 12 | tommot
Processing Record 34 of Set 12 | chimore
Processing Record 35 of Set 12 | cuamba
Processing Record 36 of Set 12 | noumea
Processing Record 37 of Set 12 | agropoli
Processing Record 38 of Set 12 | prudy
Processing Record 39 of Set 12 | ramsar
Processing Record 40 of Set 12 | thinadhoo
Processing Record 41 of Set 12 | 

In [16]:
# Convert the array of dictionaries to a Pandas DataFrame
city_data_df = pd.DataFrame(city_data)
city_data_df.head(10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Carnarvon,-24.8667,113.6333,295.19,78,0,9.26,AU,"2021, 11, 29 18:45:35"
1,Acapulco,16.8634,-99.8901,303.05,66,1,2.57,MX,"2021, 11, 29 18:42:32"
2,Barrow,71.2906,-156.7887,245.16,69,1,3.6,US,"2021, 11, 29 18:42:51"
3,Vaini,-21.2,-175.2,298.24,78,40,5.14,TO,"2021, 11, 29 18:45:16"
4,Bethel,41.3712,-73.414,278.18,68,75,0.45,US,"2021, 11, 29 18:45:13"
5,Esperance,-33.8667,121.9,287.06,72,100,5.25,AU,"2021, 11, 29 18:47:07"
6,Mana,5.6592,-53.7767,301.29,74,88,3.99,GF,"2021, 11, 29 18:47:08"
7,Bluff,-46.6,168.3333,286.93,80,100,4.61,NZ,"2021, 11, 29 18:47:08"
8,Upernavik,72.7868,-56.1549,267.22,96,100,2.79,GL,"2021, 11, 29 18:47:09"
9,Pevek,69.7008,170.3133,256.3,96,100,1.66,RU,"2021, 11, 29 18:47:09"


In [17]:
# Reorder the columns to make it easier to read
new_column_order = ["City", "Country", "Date", "Lat", "Lng", "Max Temp", "Humidity", "Cloudiness", "Wind Speed"]
city_data_df = city_data_df[new_column_order]
city_data_df.head()

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Carnarvon,AU,"2021, 11, 29 18:45:35",-24.8667,113.6333,295.19,78,0,9.26
1,Acapulco,MX,"2021, 11, 29 18:42:32",16.8634,-99.8901,303.05,66,1,2.57
2,Barrow,US,"2021, 11, 29 18:42:51",71.2906,-156.7887,245.16,69,1,3.6
3,Vaini,TO,"2021, 11, 29 18:45:16",-21.2,-175.2,298.24,78,40,5.14
4,Bethel,US,"2021, 11, 29 18:45:13",41.3712,-73.414,278.18,68,75,0.45


In [18]:
# Create the output file (csv)
output_data_file = "weather_data/cities.csv"
# export the city_data into a csv.
city_data_df.to_csv(output_data_file, index_label="City_ID")