In [1]:
# Import the dependencies.
from pathlib import Path

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd

In [2]:
# Draw 1,500 uniformly distributed latitudes and longitudes spanning the globe.
lats = np.random.uniform(-90.000, 90.000, size=1500)
lngs = np.random.uniform(-180.000, 180.000, size=1500)
# Pair each latitude with the longitude at the same position (zip is a one-shot iterator).
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x1e7d7131448>

In [3]:
# Materialize the zipped (latitude, longitude) pairs into a list so they can be iterated repeatedly.
coordinates = [*lat_lngs]

In [4]:
# Use the citipy module to determine city based on latitude and longitude.
from citipy import citipy

In [5]:
# Print the nearest city name and country code for each latitude/longitude pair.
for coordinate in coordinates:
    # Look the city up once and reuse the result for both printed fields
    # instead of repeating the same nearest-city search twice.
    nearest = citipy.nearest_city(coordinate[0], coordinate[1])
    print(nearest.city_name, nearest.country_code)


kodiak us
albany au
castro cl
bredasdorp za
nanortalik gl
hambantota lk
arraial do cabo br
clonakilty ie
rikitea pf
rikitea pf
pandan ph
cape town za
rikitea pf
cidreira br
carnarvon au
general roca ar
dingle ie
busselton au
albany au
hobart au
punta arenas cl
punta arenas cl
butaritari ki
busselton au
hobart au
kununurra au
saint george bm
taolanaro mg
port alfred za
barrow us
new norfolk au
taolanaro mg
iqaluit ca
kapaa us
nalut ly
augusto correa br
higuey do
hobart au
sur om
port alfred za
qaanaaq gl
mataura pf
rikitea pf
illoqqortoormiut gl
talara pe
tilichiki ru
dubrovnik hr
vanimo pg
bonthe sl
torbay ca
karabuk tr
arraial do cabo br
lang suan th
kavieng pg
amderma ru
taolanaro mg
mar del plata ar
great yarmouth gb
georgetown sh
cape town za
praia da vitoria pt
port elizabeth za
byron bay au
alofi nu
clyde river ca
namibe ao
havoysund no
ushuaia ar
busselton au
jian cn
kapaa us
hermanus za
barrow us
puerto ayora ec
ushuaia ar
punta arenas cl
abu samrah qa
bluff nz
nouadhibou mr
sa

hermanus za
mar del plata ar
vaini to
yellowknife ca
ceska ves cz
jaciara br
lagoa pt
tsihombe mg
pita gn
mitzic ga
punta arenas cl
puerto ayora ec
andenes no
konza ke
katsina ng
albany au
tortoli it
punta arenas cl
ribeira grande pt
sydney au
saldanha za
vaini to
ribeira grande pt
rosarito mx
nikolskoye ru
tessalit ml
makakilo city us
sentyabrskiy ru
barrow us
at-bashi kg
jamestown sh
kenai us
ust-nera ru
saint anthony ca
port elizabeth za
santa rosa ar
tuatapere nz
punta arenas cl
asyut eg
jamestown sh
albany au
puerto carreno co
bredasdorp za
souillac mu
komsomolskiy ru
ushuaia ar
avarua ck
cape town za
manching de
numan ng
nanakuli us
pacific grove us
grindavik is
georgetown sh
ostrovnoy ru
kahului us
kamaishi jp
boa vista br
urdzhar kz
barentsburg sj
koygorodok ru
constitucion mx
bontang id
albany au
albany au
hasaki jp
manyana bw
hermanus za
hermanus za
pisco pe
belushya guba ru
albany au
zhengjiatun cn
umm kaddadah sd
barentsburg sj
vestmannaeyjar is
rikitea pf
bluff nz
ushuaia 

In [6]:
# Create a list for holding the cities (kept in first-seen order).
cities = []
# Companion set so the uniqueness check is a constant-time lookup rather than
# a scan of the whole list on every coordinate.
seen_cities = set()
# Identify the nearest city for each latitude and longitude combination.
for coordinate in coordinates:
    city = citipy.nearest_city(coordinate[0], coordinate[1]).city_name

    # If the city is unique, then we will add it to the cities list.
    # NOTE(review): uniqueness is decided by name only, so same-named cities in
    # different countries collapse into one entry — confirm this is intended.
    if city not in seen_cities:
        seen_cities.add(city)
        cities.append(city)
# Print the city count to confirm sufficient count.
len(cities)

623

In [7]:
# Import the requests library.
import requests

# Import the API key.
from config import weather_api_key

# Import the datetime module from the datetime library.
from datetime import datetime

In [8]:
# Base URL for the OpenWeatherMap current-weather endpoint, requesting imperial units.
# HTTPS is used so the API key carried in the query string is not sent in plaintext.
url = "https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

In [9]:
# Create an empty list to hold the weather data (one dict per successfully retrieved city).
city_data = []

# Number of cities grouped into one logging set.
set_size = 50
# Seconds to wait for each API response before giving up on that city,
# so a stalled connection cannot hang the whole retrieval.
request_timeout = 10

# Print the beginning of the logging.
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Loop through all the cities in the list.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes; both counters are
    # 1-based and derived directly from the loop index.
    set_count = i // set_size + 1
    record_count = i % set_size + 1

    # Log the record and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")

    # Run an API request for each of the cities.
    try:
        # Pass the city as a query parameter so requests URL-encodes it
        # (spaces and any other special characters) onto the base URL.
        response = requests.get(url, params={"q": city}, timeout=request_timeout)

        # Parse the JSON and retrieve data.
        city_weather = response.json()

        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]

        # Convert the response timestamp to a "YYYY-MM-DD HH:MM:SS" UTC string.
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')

        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})

    # The response lacked the expected fields (or was not valid JSON): skip the city.
    except (KeyError, TypeError, ValueError):
        print("City not found. Skipping...")

    # Network-level failure (timeout, connection error, ...): skip the city.
    # Only the exception type is logged because the exception text can
    # include the request URL, which contains the API key.
    except requests.RequestException as exc:
        print(f"Request failed for {city} ({type(exc).__name__}). Skipping...")


# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | kodiak
Processing Record 2 of Set 1 | albany
Processing Record 3 of Set 1 | castro
Processing Record 4 of Set 1 | bredasdorp
Processing Record 5 of Set 1 | nanortalik
Processing Record 6 of Set 1 | hambantota
Processing Record 7 of Set 1 | arraial do cabo
Processing Record 8 of Set 1 | clonakilty
Processing Record 9 of Set 1 | rikitea
Processing Record 10 of Set 1 | pandan
Processing Record 11 of Set 1 | cape town
Processing Record 12 of Set 1 | cidreira
Processing Record 13 of Set 1 | carnarvon
Processing Record 14 of Set 1 | general roca
Processing Record 15 of Set 1 | dingle
Processing Record 16 of Set 1 | busselton
Processing Record 17 of Set 1 | hobart
Processing Record 18 of Set 1 | punta arenas
Processing Record 19 of Set 1 | butaritari
Processing Record 20 of Set 1 | kununurra
Processing Record 21 of Set 1 | saint george
Processing Record 22 of Set 1 | taolanaro
City not found. Skipping..

Processing Record 34 of Set 4 | sisimiut
Processing Record 35 of Set 4 | cubuk
Processing Record 36 of Set 4 | tepu
Processing Record 37 of Set 4 | bougouni
Processing Record 38 of Set 4 | sheridan
Processing Record 39 of Set 4 | manavalakurichi
Processing Record 40 of Set 4 | esfarayen
Processing Record 41 of Set 4 | stokmarknes
Processing Record 42 of Set 4 | hasaki
Processing Record 43 of Set 4 | marmaron
City not found. Skipping...
Processing Record 44 of Set 4 | radzyn podlaski
Processing Record 45 of Set 4 | longyearbyen
Processing Record 46 of Set 4 | port-gentil
Processing Record 47 of Set 4 | ust-kuyga
Processing Record 48 of Set 4 | bethel
Processing Record 49 of Set 4 | itaituba
Processing Record 50 of Set 4 | burnie
Processing Record 1 of Set 5 | aloleng
Processing Record 2 of Set 5 | turukhansk
Processing Record 3 of Set 5 | upernavik
Processing Record 4 of Set 5 | saskylakh
Processing Record 5 of Set 5 | ngawi
Processing Record 6 of Set 5 | pocone
Processing Record 7 of S

Processing Record 20 of Set 8 | itarema
Processing Record 21 of Set 8 | goundam
Processing Record 22 of Set 8 | gurgan
City not found. Skipping...
Processing Record 23 of Set 8 | sinnamary
Processing Record 24 of Set 8 | cabras
Processing Record 25 of Set 8 | tanout
Processing Record 26 of Set 8 | pemangkat
Processing Record 27 of Set 8 | faanui
Processing Record 28 of Set 8 | bokspits
City not found. Skipping...
Processing Record 29 of Set 8 | voh
Processing Record 30 of Set 8 | tessalit
Processing Record 31 of Set 8 | cantaura
Processing Record 32 of Set 8 | tuatapere
Processing Record 33 of Set 8 | grand gaube
Processing Record 34 of Set 8 | pampa
Processing Record 35 of Set 8 | angoram
Processing Record 36 of Set 8 | uyemskiy
Processing Record 37 of Set 8 | gillette
Processing Record 38 of Set 8 | norman wells
Processing Record 39 of Set 8 | bahia honda
Processing Record 40 of Set 8 | zhigalovo
Processing Record 41 of Set 8 | alvand
Processing Record 42 of Set 8 | sibolga
Processin

Processing Record 10 of Set 12 | cabo san lucas
Processing Record 11 of Set 12 | soyo
Processing Record 12 of Set 12 | fort-shevchenko
Processing Record 13 of Set 12 | dvorichna
Processing Record 14 of Set 12 | atambua
Processing Record 15 of Set 12 | akhmim
Processing Record 16 of Set 12 | fukue
Processing Record 17 of Set 12 | primorsk
Processing Record 18 of Set 12 | nome
Processing Record 19 of Set 12 | ciempozuelos
Processing Record 20 of Set 12 | guozhen
Processing Record 21 of Set 12 | hvide sande
Processing Record 22 of Set 12 | kopervik
Processing Record 23 of Set 12 | nchelenge
Processing Record 24 of Set 12 | thurso
Processing Record 25 of Set 12 | hefei
Processing Record 26 of Set 12 | batticaloa
Processing Record 27 of Set 12 | umm lajj
Processing Record 28 of Set 12 | mazamari
Processing Record 29 of Set 12 | tierra blanca
Processing Record 30 of Set 12 | wagar
Processing Record 31 of Set 12 | kopong
Processing Record 32 of Set 12 | tura
Processing Record 33 of Set 12 | m

In [10]:
# Build a DataFrame from the collected per-city records and preview the first ten rows.
city_data_df = pd.DataFrame(data=city_data)
city_data_df.head(n=10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Kodiak,57.79,-152.4072,40.51,81,100,6.91,US,2022-03-13 02:41:11
1,Albany,42.6001,-73.9662,19.76,63,80,3.0,US,2022-03-13 02:37:09
2,Castro,-24.7911,-50.0119,61.14,99,100,7.58,BR,2022-03-13 02:41:12
3,Bredasdorp,-34.5322,20.0403,61.92,77,1,3.44,ZA,2022-03-13 02:41:12
4,Nanortalik,60.1432,-45.2371,13.87,69,100,31.56,GL,2022-03-13 02:41:12
5,Hambantota,6.1241,81.1185,75.54,100,20,3.44,LK,2022-03-13 02:41:13
6,Arraial Do Cabo,-22.9661,-42.0278,77.07,90,100,1.66,BR,2022-03-13 02:41:13
7,Clonakilty,51.6231,-8.8706,47.41,86,50,25.72,IE,2022-03-13 02:41:14
8,Rikitea,-23.1203,-134.9692,79.99,71,44,13.35,PF,2022-03-13 02:41:14
9,Pandan,14.0453,124.1694,81.36,82,55,8.43,PH,2022-03-13 02:41:15


In [11]:
# Desired left-to-right column layout for the weather DataFrame.
new_column_order = [
    "City",
    "Country",
    "Date",
    "Lat",
    "Lng",
    "Max Temp",
    "Humidity",
    "Cloudiness",
    "Wind Speed",
]


In [12]:
# Select every row with the columns arranged in the new order.
city_data_df = city_data_df.loc[:, new_column_order]

In [13]:
# Display the reordered DataFrame to confirm the new column layout.
city_data_df

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Kodiak,US,2022-03-13 02:41:11,57.7900,-152.4072,40.51,81,100,6.91
1,Albany,US,2022-03-13 02:37:09,42.6001,-73.9662,19.76,63,80,3.00
2,Castro,BR,2022-03-13 02:41:12,-24.7911,-50.0119,61.14,99,100,7.58
3,Bredasdorp,ZA,2022-03-13 02:41:12,-34.5322,20.0403,61.92,77,1,3.44
4,Nanortalik,GL,2022-03-13 02:41:12,60.1432,-45.2371,13.87,69,100,31.56
...,...,...,...,...,...,...,...,...,...
566,Vyazemskiy,RU,2022-03-13 02:44:55,47.5378,134.7525,29.37,94,100,4.68
567,Yantarnyy,RU,2022-03-13 02:44:55,54.8717,19.9381,21.06,53,0,5.53
568,Maragogi,BR,2022-03-13 02:44:56,-9.0122,-35.2225,79.23,79,99,5.95
569,Kasiri,SL,2022-03-13 02:44:56,8.9412,-13.1148,74.10,85,80,3.69


In [14]:
# Create the output file (CSV).
output_data_file = "weather_data/cities.csv"
# Make sure the destination folder exists first; to_csv does not create
# missing directories and would otherwise fail on a fresh checkout.
Path(output_data_file).parent.mkdir(parents=True, exist_ok=True)
# Export the City_Data into a CSV, labelling the index column "City_ID".
city_data_df.to_csv(output_data_file, index_label="City_ID")