In [1]:
# Import the dependencies
from pathlib import Path

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd

In [2]:
# Draw random latitudes and longitudes and pair them up lazily.
# NOTE: zip() returns a one-shot iterator, so the pairs can be consumed only once.
sample_size = 1500
lats = np.random.uniform(-90.000, 90.000, sample_size)
lngs = np.random.uniform(-180.000, 180.000, sample_size)
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x7f817c73a600>

In [3]:
# Import from Citipy dependency.
from citipy import citipy

In [4]:
# Materialize the latitude/longitude pairs as a list.
# The pairs are rebuilt from the `lats` and `lngs` arrays instead of draining
# the one-shot `lat_lngs` zip iterator, so this cell is idempotent: re-running
# it yields the same coordinates rather than an empty list.
coordinates = list(zip(lats, lngs))

In [5]:
# Look up the nearest city name for every coordinate pair.
nearest_city_names = (
    citipy.nearest_city(lat, lng).city_name for lat, lng in coordinates
)

# dict.fromkeys keeps only the first occurrence of each name and preserves
# encounter order, giving the list of unique cities.
cities = list(dict.fromkeys(nearest_city_names))

# Show the number of unique cities to confirm the sample is large enough.
len(cities)

636

In [6]:
# Import the API key.
from config import weather_api_key

In [7]:
# Base URL for the OpenWeatherMap current-weather API call (imperial units).
# HTTPS is used so the API key carried in the query string is not sent in cleartext.
url = 'https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=' + weather_api_key

In [8]:
# Import the time library and the datetime module from the datetime library
import time
from datetime import datetime

In [9]:
# Import the requests Library. 
import requests

# Import the API key.
from config import weather_api_key

In [10]:
# Create an empty list to hold the weather data (one dict per city).
city_data = []

# Seconds to wait on a single request before giving up, so one stalled
# connection cannot hang the whole retrieval loop.
request_timeout = 10

# Print the beginning of the logging.
print('Beginning Data Retrieval     ')
print('-----------------------------')

# Create counters used only for the progress log.
record_count = 1
set_count = 1

# Loop through all the cities in the list.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes and pause 60 seconds
    # between sets (presumably to respect the API's per-minute rate limit).
    if i % 50 == 0 and i >= 50:
        set_count += 1
        record_count = 1
        time.sleep(60)

    # Log the record and set numbers and the city, then advance the counter.
    print(f'Processing Record {record_count} of Set {set_count} | {city}')
    record_count += 1

    # Run an API request for the city; any failure skips just this city.
    try:
        # Pass the city as a query parameter so requests URL-encodes it
        # (spaces and non-ASCII characters) and appends it to the base URL.
        response = requests.get(url, params={'q': city}, timeout=request_timeout)

        # Turn 4xx/5xx responses into HTTPError instead of parsing an error body.
        response.raise_for_status()

        # Parse the JSON and retrieve the data.
        city_weather = response.json()

        # Parse out the needed data.
        city_lat = city_weather['coord']['lat']
        city_lng = city_weather['coord']['lon']
        city_max_temp = city_weather['main']['temp_max']
        city_humidity = city_weather['main']['humidity']
        city_clouds = city_weather['clouds']['all']
        city_wind = city_weather['wind']['speed']
        city_country = city_weather['sys']['country']

        # Convert the Unix timestamp to a 'YYYY-MM-DD HH:MM:SS' UTC string.
        # NOTE: datetime.utcfromtimestamp is deprecated since Python 3.12.
        city_date = datetime.utcfromtimestamp(city_weather['dt']).strftime('%Y-%m-%d %H:%M:%S')

        # Append the city information into the city_data list.
        city_data.append({'City': city.title(),
                          'Lat': city_lat,
                          'Lng': city_lng,
                          'Max Temp': city_max_temp,
                          'Humidity': city_humidity,
                          'Cloudiness': city_clouds,
                          'Wind Speed': city_wind,
                          'Country': city_country,
                          'Date': city_date})

    except requests.exceptions.HTTPError as err:
        # Only a 404 really means the city is unknown; report other statuses
        # (e.g. a rejected API key) distinctly. The exception text is not
        # printed because it contains the request URL, including the API key.
        status = getattr(err.response, 'status_code', None)
        if status == 404:
            print('City not found. Skipping...')
        else:
            print(f'Request failed with HTTP status {status}. Skipping...')
    except (requests.exceptions.RequestException, ValueError, KeyError) as err:
        # Network failure, timeout, invalid JSON, or a missing field in the
        # payload. KeyboardInterrupt/SystemExit are deliberately not caught.
        print(f'Could not retrieve weather data ({type(err).__name__}). Skipping...')

# Indicate the data loading is complete.
print('-----------------------------')
print('Data Retrieval Complete      ')
print('-----------------------------')

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | mahebourg
Processing Record 2 of Set 1 | ushuaia
Processing Record 3 of Set 1 | ribeira grande
Processing Record 4 of Set 1 | lebedyn
Processing Record 5 of Set 1 | quatre cocos
Processing Record 6 of Set 1 | sete
Processing Record 7 of Set 1 | busselton
Processing Record 8 of Set 1 | vaini
Processing Record 9 of Set 1 | sao joao da barra
Processing Record 10 of Set 1 | tessalit
Processing Record 11 of Set 1 | kabo
Processing Record 12 of Set 1 | tezu
Processing Record 13 of Set 1 | sentyabrskiy
City not found. Skipping...
Processing Record 14 of Set 1 | bengkulu
Processing Record 15 of Set 1 | upernavik
Processing Record 16 of Set 1 | rikitea
Processing Record 17 of Set 1 | hamilton
Processing Record 18 of Set 1 | deputatskiy
Processing Record 19 of Set 1 | barrow
Processing Record 20 of Set 1 | avarua
Processing Record 21 of Set 1 | kapaa
Processing Record 22 of Set 1 | hobart
Processing Record

Processing Record 41 of Set 4 | mangla
Processing Record 42 of Set 4 | marsabit
Processing Record 43 of Set 4 | makakilo city
Processing Record 44 of Set 4 | kazalinsk
City not found. Skipping...
Processing Record 45 of Set 4 | san jose
Processing Record 46 of Set 4 | salatiga
Processing Record 47 of Set 4 | clovis
Processing Record 48 of Set 4 | la plata
Processing Record 49 of Set 4 | provideniya
Processing Record 50 of Set 4 | staroutkinsk
Processing Record 1 of Set 5 | luang prabang
Processing Record 2 of Set 5 | sunrise manor
Processing Record 3 of Set 5 | vila franca do campo
Processing Record 4 of Set 5 | leh
Processing Record 5 of Set 5 | katsuura
Processing Record 6 of Set 5 | lagoa
Processing Record 7 of Set 5 | hovd
Processing Record 8 of Set 5 | barth
Processing Record 9 of Set 5 | pangkalanbuun
Processing Record 10 of Set 5 | yeletskiy
City not found. Skipping...
Processing Record 11 of Set 5 | conde
Processing Record 12 of Set 5 | khorixas
Processing Record 13 of Set 5 | 

Processing Record 25 of Set 8 | gilgit
Processing Record 26 of Set 8 | dosso
Processing Record 27 of Set 8 | zhanaozen
Processing Record 28 of Set 8 | praya
Processing Record 29 of Set 8 | jega
Processing Record 30 of Set 8 | saint-augustin
Processing Record 31 of Set 8 | baruun-urt
Processing Record 32 of Set 8 | alice springs
Processing Record 33 of Set 8 | itatskiy
Processing Record 34 of Set 8 | paciran
Processing Record 35 of Set 8 | berbera
Processing Record 36 of Set 8 | honiara
Processing Record 37 of Set 8 | progreso
Processing Record 38 of Set 8 | nizhniy kuranakh
Processing Record 39 of Set 8 | nemuro
Processing Record 40 of Set 8 | shache
Processing Record 41 of Set 8 | buchanan
Processing Record 42 of Set 8 | marsa matruh
Processing Record 43 of Set 8 | gorom-gorom
Processing Record 44 of Set 8 | cambridge
Processing Record 45 of Set 8 | togur
Processing Record 46 of Set 8 | bubaque
Processing Record 47 of Set 8 | pimentel
Processing Record 48 of Set 8 | kharp
Processing R

Processing Record 13 of Set 12 | evensk
Processing Record 14 of Set 12 | doctor arroyo
Processing Record 15 of Set 12 | sorong
Processing Record 16 of Set 12 | olinda
Processing Record 17 of Set 12 | sangar
Processing Record 18 of Set 12 | khromtau
Processing Record 19 of Set 12 | chingirlau
Processing Record 20 of Set 12 | saryg-sep
Processing Record 21 of Set 12 | margate
Processing Record 22 of Set 12 | merke
Processing Record 23 of Set 12 | kovdor
Processing Record 24 of Set 12 | george town
Processing Record 25 of Set 12 | college
Processing Record 26 of Set 12 | carauari
Processing Record 27 of Set 12 | trairi
Processing Record 28 of Set 12 | katherine
Processing Record 29 of Set 12 | gold coast
Processing Record 30 of Set 12 | rantepao
Processing Record 31 of Set 12 | khalkhal
Processing Record 32 of Set 12 | nanortalik
Processing Record 33 of Set 12 | richards bay
Processing Record 34 of Set 12 | kajaani
Processing Record 35 of Set 12 | hasaki
Processing Record 36 of Set 12 | o

In [11]:
# Build a Pandas DataFrame from the list of per-city dictionaries and preview
# the first ten rows.
city_data_df = pd.DataFrame(data=city_data)
city_data_df.head(n=10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Mahebourg,-20.4081,57.7,71.89,68,40,12.66,MU,2022-10-08 16:54:11
1,Ushuaia,-54.8,-68.3,47.82,76,100,8.05,AR,2022-10-08 16:52:32
2,Ribeira Grande,38.5167,-28.7,75.6,83,40,8.05,PT,2022-10-08 16:54:12
3,Lebedyn,50.5852,34.4849,51.91,68,13,6.44,UA,2022-10-08 16:54:12
4,Quatre Cocos,-20.2078,57.7625,71.71,69,45,16.44,MU,2022-10-08 16:54:12
5,Sete,43.4018,3.6966,71.64,78,100,6.4,FR,2022-10-08 16:54:13
6,Busselton,-33.65,115.3333,53.58,81,12,3.76,AU,2022-10-08 16:54:14
7,Vaini,-21.2,-175.2,71.76,94,100,14.97,TO,2022-10-08 16:54:14
8,Sao Joao Da Barra,-21.6403,-41.0511,80.69,71,61,16.58,BR,2022-10-08 16:54:17
9,Tessalit,20.1986,1.0114,99.41,11,14,12.95,ML,2022-10-08 16:54:17


In [12]:
# Put the identifying columns (city, country, date) first, followed by the
# coordinates and then the weather measurements.
new_column_order = [
    'City', 'Country', 'Date',
    'Lat', 'Lng',
    'Max Temp', 'Humidity', 'Cloudiness', 'Wind Speed',
]
city_data_df = city_data_df.loc[:, new_column_order]
city_data_df.head(n=10)

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Mahebourg,MU,2022-10-08 16:54:11,-20.4081,57.7,71.89,68,40,12.66
1,Ushuaia,AR,2022-10-08 16:52:32,-54.8,-68.3,47.82,76,100,8.05
2,Ribeira Grande,PT,2022-10-08 16:54:12,38.5167,-28.7,75.6,83,40,8.05
3,Lebedyn,UA,2022-10-08 16:54:12,50.5852,34.4849,51.91,68,13,6.44
4,Quatre Cocos,MU,2022-10-08 16:54:12,-20.2078,57.7625,71.71,69,45,16.44
5,Sete,FR,2022-10-08 16:54:13,43.4018,3.6966,71.64,78,100,6.4
6,Busselton,AU,2022-10-08 16:54:14,-33.65,115.3333,53.58,81,12,3.76
7,Vaini,TO,2022-10-08 16:54:14,-21.2,-175.2,71.76,94,100,14.97
8,Sao Joao Da Barra,BR,2022-10-08 16:54:17,-21.6403,-41.0511,80.69,71,61,16.58
9,Tessalit,ML,2022-10-08 16:54:17,20.1986,1.0114,99.41,11,14,12.95


In [13]:
# Path of the output file (CSV).
output_data_file = 'weather_data/cities.csv'
# Make sure the target directory exists: to_csv does not create missing
# parent directories and would otherwise fail after the long retrieval run.
Path(output_data_file).parent.mkdir(parents=True, exist_ok=True)
# Export the city data into a CSV, labelling the index column "City_ID".
city_data_df.to_csv(output_data_file, index_label="City_ID")